From 3052c10566951d3076d675a4a07f28f8baacb2fc Mon Sep 17 00:00:00 2001 From: Henry Jin Date: Fri, 26 Jun 2020 07:54:45 -0700 Subject: [PATCH] v5.0.1 release --- Chap_memory_model.tex | 17 +- Chap_tasking.tex | 5 +- Examples_Chapt.tex | 5 + Examples_SIMD.tex | 32 +- Examples_acquire_release.tex | 16 +- Examples_affinity.tex | 20 +- Examples_affinity_display.tex | 12 +- Examples_affinity_query.tex | 4 +- Examples_allocators.tex | 4 +- Examples_array_sections.tex | 16 +- Examples_array_shaping.tex | 10 +- Examples_associate.tex | 6 +- Examples_async_target_nowait.tex | 4 +- Examples_async_target_nowait_depend.tex | 4 +- Examples_async_target_with_tasks.tex | 8 +- Examples_atomic.tex | 12 +- Examples_atomic_restrict.tex | 10 +- Examples_cancellation.tex | 8 +- Examples_collapse.tex | 12 +- Examples_cpp_reference.tex | 2 +- Examples_critical.tex | 2 +- Examples_declare_target.tex | 24 +- Examples_depobj.tex | 4 +- Examples_device.tex | 14 +- Examples_doacross.tex | 16 +- Examples_host_teams.tex | 4 +- Examples_init_lock_with_hint.tex | 4 +- Examples_lastprivate.tex | 10 + Examples_linear_in_loop.tex | 4 +- Examples_linear_modifier.tex | 76 + Examples_loop.tex | 4 +- Examples_mem_model.tex | 59 +- Examples_metadirective.tex | 12 +- Examples_parallel_master_taskloop.tex | 4 +- Examples_pra_iterator.tex | 2 +- Examples_reduction.tex | 159 +- Examples_requires.tex | 4 +- Examples_scan.tex | 38 + Examples_standalone.tex | 8 +- Examples_target.tex | 31 +- Examples_target_data.tex | 28 +- Examples_target_defaultmap.tex | 56 + Examples_target_mapper.tex | 16 +- Examples_target_offload.tex | 4 +- Examples_target_pointer_mapping.tex | 85 +- Examples_target_structure_mapping.tex | 4 +- Examples_target_unstructured_data.tex | 6 +- Examples_target_update.tex | 8 +- Examples_task_affinity.tex | 4 +- Examples_task_dep.tex | 69 +- Examples_task_priority.tex | 4 +- Examples_taskgroup.tex | 4 +- Examples_tasking.tex | 59 +- Examples_taskloop.tex | 8 +- Examples_taskyield.tex | 4 +- Examples_teams.tex | 24 +- Examples_udr.tex | 19 +- Examples_variant.tex | 8 +- Foreword_Chapt.tex | 4 +- History.tex | 48 +- Makefile | 48 +- README | 24 +- Title_Page.tex | 2 +- latexdiff.cfg | 5 + openmp-example.tex | 4 +- openmp-examples.tex | 8 +- openmp.sty | 59 +- sources/Example_SIMD.1.c | 1 + sources/Example_SIMD.1.f90 | 1 + sources/Example_SIMD.2.c | 1 + sources/Example_SIMD.2.f90 | 5 +- sources/Example_SIMD.3.c | 1 + sources/Example_SIMD.3.f90 | 1 + sources/Example_SIMD.4.c | 1 + sources/Example_SIMD.4.f90 | 1 + sources/Example_SIMD.5.c | 1 + sources/Example_SIMD.5.f90 | 1 + sources/Example_SIMD.6.c | 1 + sources/Example_SIMD.6.f90 | 5 +- sources/Example_SIMD.7.c | 1 + sources/Example_SIMD.7.f90 | 3 +- sources/Example_SIMD.8.c | 1 + sources/Example_SIMD.8.f90 | 1 + sources/Example_acquire_release.1.c | 3 +- sources/Example_acquire_release.1.f90 | 3 +- sources/Example_acquire_release.2.c | 3 +- sources/Example_acquire_release.2.f90 | 3 +- sources/Example_acquire_release.3.c | 3 +- sources/Example_acquire_release.3.f90 | 3 +- sources/Example_acquire_release_broke.4.c | 3 +- sources/Example_acquire_release_broke.4.f90 | 5 +- sources/Example_affinity.1.c | 1 + sources/Example_affinity.1.f | 1 + sources/Example_affinity.2.c | 1 + sources/Example_affinity.2.f90 | 1 + sources/Example_affinity.3.c | 1 + sources/Example_affinity.3.f | 1 + sources/Example_affinity.4.c | 1 + sources/Example_affinity.4.f90 | 1 + sources/Example_affinity.5.c | 1 + sources/Example_affinity.5.f | 1 + sources/Example_affinity.6.c | 3 +- sources/Example_affinity.6.f90 | 1 + sources/Example_affinity_display.1.c | 1 + sources/Example_affinity_display.1.f90 | 4 +- sources/Example_affinity_display.2.c | 1 + sources/Example_affinity_display.2.f90 | 5 +- sources/Example_affinity_display.3.c | 3 +- sources/Example_affinity_display.3.f90 | 4 +- sources/Example_affinity_query.1.c | 1 + sources/Example_affinity_query.1.f90 | 2 + sources/Example_allocators.1.c | 3 +- sources/Example_allocators.1.f90 | 3 +- sources/Example_array_sections.1.c | 1 + sources/Example_array_sections.1.f90 | 1 + sources/Example_array_sections.2.c | 1 + sources/Example_array_sections.2.f90 | 1 + sources/Example_array_sections.3.c | 1 + sources/Example_array_sections.3.f90 | 1 + sources/Example_array_sections.4.c | 1 + sources/Example_array_sections.4.f90 | 1 + sources/Example_array_shaping.1.c | 3 +- sources/Example_array_shaping.1.f90 | 60 + sources/Example_associate.1.f | 3 +- sources/Example_associate.2.f | 1 + sources/Example_associate.3.f90 | 1 + sources/Example_async_target.1.c | 1 + sources/Example_async_target.1.f90 | 1 + sources/Example_async_target.2.c | 1 + sources/Example_async_target.2.f90 | 1 + sources/Example_async_target.3.c | 1 + sources/Example_async_target.3.f90 | 1 + sources/Example_async_target.4.c | 1 + sources/Example_async_target.4.f90 | 1 + sources/Example_atomic.1.c | 1 + sources/Example_atomic.1.f | 1 + sources/Example_atomic.2.c | 1 + sources/Example_atomic.2.f | 1 + sources/Example_atomic.3.c | 1 + sources/Example_atomic.3.f | 1 + sources/Example_atomic_restrict.1.c | 1 + sources/Example_atomic_restrict.1.f | 1 + sources/Example_atomic_restrict.2.c | 1 + sources/Example_atomic_restrict.2.f | 1 + sources/Example_atomic_restrict.3.f | 1 + sources/Example_cancellation.1.cpp | 1 + sources/Example_cancellation.1.f90 | 1 + sources/Example_cancellation.2.c | 1 + sources/Example_cancellation.2.f90 | 1 + sources/Example_collapse.1.c | 1 + sources/Example_collapse.1.f | 1 + sources/Example_collapse.2.c | 1 + sources/Example_collapse.2.f | 1 + sources/Example_collapse.3.c | 1 + sources/Example_collapse.3.f | 1 + sources/Example_cpp_reference.1.cpp | 1 + sources/Example_critical.2.f | 1 + sources/Example_declare_target.1.c | 1 + sources/Example_declare_target.1.f90 | 1 + sources/Example_declare_target.2.cpp | 1 + sources/Example_declare_target.2.f90 | 1 + sources/Example_declare_target.3.c | 1 + sources/Example_declare_target.3.f90 | 1 + sources/Example_declare_target.4.c | 1 + sources/Example_declare_target.4.f90 | 1 + sources/Example_declare_target.5.c | 1 + sources/Example_declare_target.5.f90 | 1 + sources/Example_declare_target.6.c | 1 + sources/Example_declare_target.6.f90 | 1 + sources/Example_declare_variant.1.c | 4 +- sources/Example_declare_variant.1.f90 | 3 +- sources/Example_declare_variant.2.c | 3 +- sources/Example_declare_variant.2.f90 | 3 +- sources/Example_depobj.1.c | 3 +- sources/Example_depobj.1.f90 | 4 +- sources/Example_device.1.c | 5 + sources/Example_device.1.f90 | 1 + sources/Example_device.2.c | 1 + sources/Example_device.2.f90 | 1 + sources/Example_device.3.c | 1 + sources/Example_device.3.f90 | 1 + sources/Example_device.4.c | 1 + sources/Example_doacross.1.c | 1 + sources/Example_doacross.1.f90 | 1 + sources/Example_doacross.2.c | 1 + sources/Example_doacross.2.f90 | 1 + sources/Example_doacross.3.c | 1 + sources/Example_doacross.3.f90 | 1 + sources/Example_doacross.4.c | 1 + sources/Example_doacross.4.f90 | 1 + sources/Example_doacross.5.c | 1 + sources/Example_doacross.5.f90 | 1 + sources/Example_host_teams.1.c | 3 +- sources/Example_host_teams.1.f90 | 3 +- sources/Example_init_lock_with_hint.1.cpp | 1 + sources/Example_init_lock_with_hint.1.f | 1 + sources/Example_lastprivate.2.c | 23 + sources/Example_lastprivate.2.f90 | 21 + sources/Example_linear_in_loop.1.c | 1 + sources/Example_linear_in_loop.1.f90 | 1 + sources/Example_linear_modifier.1.cpp | 45 + sources/Example_linear_modifier.1.f90 | 48 + sources/Example_linear_modifier.2.cpp | 44 + sources/Example_linear_modifier.2.f90 | 45 + sources/Example_linear_modifier.3.c | 45 + sources/Example_linear_modifier.3.f90 | 47 + sources/Example_loop.1.c | 3 +- sources/Example_loop.1.f90 | 6 +- sources/Example_mem_model.1.c | 13 +- sources/Example_mem_model.1.f90 | 10 +- sources/Example_mem_model.2.c | 61 +- sources/Example_mem_model.2.f | 42 +- sources/Example_mem_model.3.c | 43 +- sources/Example_mem_model.3.f | 61 +- sources/Example_metadirective.1.c | 3 +- sources/Example_metadirective.1.f90 | 6 +- sources/Example_metadirective.2.c | 8 +- sources/Example_metadirective.2.f90 | 11 +- sources/Example_metadirective.3.c | 3 +- sources/Example_metadirective.3.f90 | 4 +- sources/Example_parallel_master_taskloop.1.c | 1 + .../Example_parallel_master_taskloop.1.f90 | 1 + sources/Example_pra_iterator.1.cpp | 1 + sources/Example_reduction.1.c | 1 + sources/Example_reduction.7.c | 1 + sources/Example_requires.1.cpp | 3 +- sources/Example_requires.1.f90 | 3 +- sources/Example_scan.1.c | 33 + sources/Example_scan.1.f90 | 30 + sources/Example_scan.2.c | 33 + sources/Example_scan.2.f90 | 30 + sources/Example_standalone.1.c | 1 + sources/Example_standalone.1.f90 | 1 + sources/Example_standalone.2.c | 1 + sources/Example_standalone.2.f90 | 1 + sources/Example_target.1.c | 1 + sources/Example_target.1.f90 | 1 + sources/Example_target.2.c | 1 + sources/Example_target.2.f90 | 1 + sources/Example_target.3.c | 1 + sources/Example_target.3.f90 | 1 + sources/Example_target.4.c | 1 + sources/Example_target.4.f90 | 1 + sources/Example_target.4b.f90 | 1 + sources/Example_target.5.c | 6 + sources/Example_target.5.f90 | 5 + sources/Example_target.6.c | 6 + sources/Example_target.6.f90 | 5 + sources/Example_target_data.1.c | 1 + sources/Example_target_data.1.f90 | 1 + sources/Example_target_data.2.c | 1 + sources/Example_target_data.2.f90 | 1 + sources/Example_target_data.3.c | 1 + sources/Example_target_data.3.f90 | 1 + sources/Example_target_data.4.c | 1 + sources/Example_target_data.4.f90 | 1 + sources/Example_target_data.5.cpp | 1 + sources/Example_target_data.5.f90 | 1 + sources/Example_target_data.6.c | 1 + sources/Example_target_data.6.f90 | 1 + sources/Example_target_data.7.c | 1 + sources/Example_target_data.7.f90 | 1 + sources/Example_target_defaultmap.1.c | 93 + sources/Example_target_defaultmap.1.f90 | 105 + sources/Example_target_mapper.1.c | 5 +- sources/Example_target_mapper.1.f90 | 4 +- sources/Example_target_mapper.2.c | 3 +- sources/Example_target_mapper.2.f90 | 1 + sources/Example_target_mapper.3.c | 3 +- sources/Example_target_mapper.3.f90 | 1 + sources/Example_target_offload_control.1.c | 3 +- sources/Example_target_offload_control.1.f90 | 3 +- sources/Example_target_ptr_map.1.c | 3 +- sources/Example_target_ptr_map.2.c | 1 + sources/Example_target_ptr_map.3a.c | 43 + sources/Example_target_ptr_map.3b.c | 40 + sources/Example_target_reduction.1.c | 34 + sources/Example_target_reduction.1.f90 | 40 + sources/Example_target_reduction.2.c | 36 + sources/Example_target_reduction.2.f90 | 43 + sources/Example_target_reverse_offload.7.c | 1 + sources/Example_target_reverse_offload.7.f90 | 7 +- sources/Example_target_struct_map.1.c | 1 + sources/Example_target_struct_map.2.c | 1 + sources/Example_target_struct_map.2.cpp | 1 + sources/Example_target_task_reduction.1.c | 32 + sources/Example_target_task_reduction.1.f90 | 40 + sources/Example_target_task_reduction.2a.c | 35 + sources/Example_target_task_reduction.2a.f90 | 38 + sources/Example_target_task_reduction.2b.c | 30 + sources/Example_target_task_reduction.2b.f90 | 38 + sources/Example_target_unstructured_data.1.c | 1 + .../Example_target_unstructured_data.1.cpp | 1 + .../Example_target_unstructured_data.1.f90 | 1 + sources/Example_target_update.1.c | 2 + sources/Example_target_update.1.f90 | 1 + sources/Example_target_update.2.c | 1 + sources/Example_target_update.2.f90 | 1 + sources/Example_task_dep.1.c | 1 + sources/Example_task_dep.1.f90 | 1 + sources/Example_task_dep.10.c | 3 + sources/Example_task_dep.10.f90 | 1 + sources/Example_task_dep.11.c | 4 +- sources/Example_task_dep.11.f90 | 6 +- sources/Example_task_dep.12.c | 29 + sources/Example_task_dep.12.f90 | 27 + sources/Example_task_dep.2.c | 1 + sources/Example_task_dep.2.f90 | 1 + sources/Example_task_dep.3.c | 1 + sources/Example_task_dep.3.f90 | 1 + sources/Example_task_dep.4.c | 1 + sources/Example_task_dep.4.f90 | 1 + sources/Example_task_dep.5.c | 1 + sources/Example_task_dep.5.f90 | 1 + sources/Example_task_dep.6.c | 1 + sources/Example_task_dep.6.f90 | 1 + sources/Example_task_dep.7.c | 1 + sources/Example_task_dep.7.f90 | 1 + sources/Example_task_dep.8.c | 1 + sources/Example_task_dep.8.f90 | 1 + sources/Example_task_dep.9.c | 1 + sources/Example_task_dep.9.f90 | 1 + sources/Example_task_priority.1.c | 1 + sources/Example_task_priority.1.f90 | 1 + sources/Example_task_reduction.1.c | 6 +- sources/Example_task_reduction.2.c | 45 + sources/Example_task_reduction.2.f90 | 47 + sources/Example_taskgroup.1.c | 1 + sources/Example_taskgroup.1.f90 | 1 + sources/Example_tasking.1.c | 1 + sources/Example_tasking.1.f90 | 1 + sources/Example_tasking.10.c | 1 + sources/Example_tasking.10.f90 | 1 + sources/Example_tasking.11.c | 1 + sources/Example_tasking.11.f90 | 1 + sources/Example_tasking.12.c | 1 + sources/Example_tasking.12.f90 | 1 + sources/Example_tasking.13.c | 1 + sources/Example_tasking.13.f90 | 1 + sources/Example_tasking.14.c | 1 + sources/Example_tasking.14.f90 | 1 + sources/Example_tasking.15.c | 1 + sources/Example_tasking.15.f90 | 1 + sources/Example_tasking.16.c | 1 + sources/Example_tasking.16.f90 | 1 + sources/Example_tasking.17.c | 1 + sources/Example_tasking.17.f90 | 1 + sources/Example_tasking.18.c | 1 + sources/Example_tasking.18.f90 | 1 + sources/Example_tasking.19.c | 1 + sources/Example_tasking.19.f90 | 1 + sources/Example_tasking.2.c | 1 + sources/Example_tasking.2.f90 | 1 + sources/Example_tasking.3.c | 1 + sources/Example_tasking.3.f90 | 1 + sources/Example_tasking.4.c | 1 + sources/Example_tasking.4.f | 1 + sources/Example_tasking.5.c | 4 +- sources/Example_tasking.5.f | 2 + sources/Example_tasking.6.c | 1 + sources/Example_tasking.6.f | 1 + sources/Example_tasking.7.c | 1 + sources/Example_tasking.7.f | 1 + sources/Example_tasking.8.c | 1 + sources/Example_tasking.8.f | 1 + sources/Example_tasking.9.c | 1 + sources/Example_tasking.9.f | 1 + sources/Example_taskloop.1.c | 1 + sources/Example_taskloop.1.f90 | 1 + sources/Example_taskloop.2.c | 1 + sources/Example_taskloop.2.f90 | 1 + sources/Example_taskloop_reduction.1.c | 3 +- sources/Example_taskloop_reduction.1.f90 | 4 +- sources/Example_taskloop_reduction.2.c | 3 +- sources/Example_taskloop_reduction.2.f90 | 4 +- sources/Example_taskloop_simd_reduction.1.c | 1 + sources/Example_taskloop_simd_reduction.1.f90 | 3 +- sources/Example_taskyield.1.c | 1 + sources/Example_taskyield.1.f90 | 1 + sources/Example_teams.1.c | 1 + sources/Example_teams.1.f90 | 1 + sources/Example_teams.2.c | 1 + sources/Example_teams.2.f90 | 1 + sources/Example_teams.3.c | 1 + sources/Example_teams.3.f90 | 1 + sources/Example_teams.4.c | 1 + sources/Example_teams.4.f90 | 1 + sources/Example_teams.5.c | 1 + sources/Example_teams.5.f90 | 1 + sources/Example_teams.6.c | 1 + sources/Example_teams.6.f90 | 1 + sources/Example_udr.1.c | 1 + sources/Example_udr.1.f90 | 1 + sources/Example_udr.2.c | 1 + sources/Example_udr.2.f90 | 1 + sources/Example_udr.3.c | 6 +- sources/Example_udr.3.f90 | 1 + sources/Example_udr.4.f90 | 1 + sources/Example_udr.5.cpp | 1 + sources/Example_udr.6.cpp | 1 + sources/test_code_one | 15 + sources/test_codes | 55 + util/latexdiff/VERSION | 4 + util/latexdiff/latexdiff | 4951 +++++++++++++++ util/latexdiff/latexdiff-fast | 5512 +++++++++++++++++ util/latexdiff/latexdiff-vc | 824 +++ 406 files changed, 14118 insertions(+), 557 deletions(-) create mode 100644 Examples_linear_modifier.tex create mode 100644 Examples_scan.tex create mode 100644 Examples_target_defaultmap.tex create mode 100644 latexdiff.cfg create mode 100644 sources/Example_array_shaping.1.f90 create mode 100644 sources/Example_lastprivate.2.c create mode 100644 sources/Example_lastprivate.2.f90 create mode 100644 sources/Example_linear_modifier.1.cpp create mode 100644 sources/Example_linear_modifier.1.f90 create mode 100644 sources/Example_linear_modifier.2.cpp create mode 100644 sources/Example_linear_modifier.2.f90 create mode 100644 sources/Example_linear_modifier.3.c create mode 100644 sources/Example_linear_modifier.3.f90 create mode 100644 sources/Example_scan.1.c create mode 100644 sources/Example_scan.1.f90 create mode 100644 sources/Example_scan.2.c create mode 100644 sources/Example_scan.2.f90 create mode 100644 sources/Example_target_defaultmap.1.c create mode 100644 sources/Example_target_defaultmap.1.f90 create mode 100644 sources/Example_target_ptr_map.3a.c create mode 100644 sources/Example_target_ptr_map.3b.c create mode 100644 sources/Example_target_reduction.1.c create mode 100644 sources/Example_target_reduction.1.f90 create mode 100644 sources/Example_target_reduction.2.c create mode 100644 sources/Example_target_reduction.2.f90 create mode 100644 sources/Example_target_task_reduction.1.c create mode 100644 sources/Example_target_task_reduction.1.f90 create mode 100644 sources/Example_target_task_reduction.2a.c create mode 100644 sources/Example_target_task_reduction.2a.f90 create mode 100644 sources/Example_target_task_reduction.2b.c create mode 100644 sources/Example_target_task_reduction.2b.f90 create mode 100644 sources/Example_task_dep.12.c create mode 100644 sources/Example_task_dep.12.f90 create mode 100644 sources/Example_task_reduction.2.c create mode 100644 sources/Example_task_reduction.2.f90 create mode 100644 sources/test_code_one create mode 100755 sources/test_codes create mode 100644 util/latexdiff/VERSION create mode 100755 util/latexdiff/latexdiff create mode 100755 util/latexdiff/latexdiff-fast create mode 100755 util/latexdiff/latexdiff-vc diff --git a/Chap_memory_model.tex b/Chap_memory_model.tex index 6447dcd..85dfcdf 100644 --- a/Chap_memory_model.tex +++ b/Chap_memory_model.tex @@ -48,15 +48,14 @@ document. In this chapter, examples illustrate how race conditions may arise for accesses to variables with a \plc{shared} data-sharing attribute when flush operations are not properly employed. A race condition can exist when two or more threads -are involved in accessing a variable in which not all of the accesses are -reads; that is, a WaR, RaW or WaW condition exists (R=read, a=after, W=write). -A RaR does not produce a race condition. In particular, a data race will arise -when conflicting accesses do not have a well-defined \emph{completion order}. -The existence of data races in OpenMP programs result in undefined behavior, -and so they should generally be avoided for programs to be correct. The -completion order of accesses to a shared variable is guaranteed in OpenMP -through a set of memory consistency rules that are described in the \plc{OpenMP -Memory Consitency} section of the OpenMP Specifications document. +are involved in accessing a variable and at least one of the accesses modifies +the variable. In particular, a data race will arise when conflicting accesses +do not have a well-defined \emph{completion order}. The existence of data +races in OpenMP programs result in undefined behavior, and so they should +generally be avoided for programs to be correct. The completion order of +accesses to a shared variable is guaranteed in OpenMP through a set of memory +consistency rules that are described in the \plc{OpenMP Memory Consitency} +section of the OpenMP Specifications document. %This chapter also includes examples that exhibit non-sequentially consistent %(\emph{non-SC}) behavior. Sequential consistency (\emph{SC}) is the desirable diff --git a/Chap_tasking.tex b/Chap_tasking.tex index 4cb72c7..59e15da 100644 --- a/Chap_tasking.tex +++ b/Chap_tasking.tex @@ -40,8 +40,9 @@ for executing the task to completion, even though it may leave the execution at a scheduling point and return later. The thread is tied to the task. Scheduling points can be introduced with the \code{taskyield} construct. With an \code{untied} clause any other thread is allowed to continue -the task. An \code{if} clause with a \plc{true} expression allows the -generating thread to immediately execute the task as an undeferred task. +the task. An \code{if} clause with an expression that evaluates to \plc{false} +results in an \emph{undeferred} task, which instructs the runtime to suspend +the generating task until the undeferred task completes its execution. By including the data environment of the generating task into the generated task with the \code{mergeable} and \code{final} clauses, task generation overhead can be reduced. diff --git a/Examples_Chapt.tex b/Examples_Chapt.tex index ebc689c..ce772ee 100644 --- a/Examples_Chapt.tex +++ b/Examples_Chapt.tex @@ -19,3 +19,8 @@ source form. \plc{ext} is one of the following: \item \plc{f90} -- Fortran code in free form. \end{compactitem} +Some of the example labels may include version information +(\code{\small{}omp\_\plc{verno}}) to indicate features that are illustrated +by an example for a specific OpenMP version, such as ``\plc{scan.1.c} +\;(\code{\small{}omp\_5.0}).'' + diff --git a/Examples_SIMD.tex b/Examples_SIMD.tex index 6008fd8..fd1f29e 100644 --- a/Examples_SIMD.tex +++ b/Examples_SIMD.tex @@ -5,9 +5,9 @@ The following example illustrates the basic use of the \code{simd} construct to assure the compiler that the loop can be vectorized. -\cexample{SIMD}{1} +\cexample[4.0]{SIMD}{1} -\ffreeexample{SIMD}{1} +\ffreeexample[4.0]{SIMD}{1} \clearpage @@ -40,9 +40,9 @@ In the \code{simd} constructs for the loops the \code{private(tmp)} clause is necessary to assure that the each vector operation has its own \plc{tmp} variable. -\cexample{SIMD}{2} +\cexample[4.0]{SIMD}{2} -\ffreeexample{SIMD}{2} +\ffreeexample[4.0]{SIMD}{2} \pagebreak A thread that encounters a SIMD construct executes a vectorized code of the @@ -52,9 +52,9 @@ privatized and declared as reductions with clauses. The example below illustrates the use of \code{private} and \code{reduction} clauses in a SIMD construct. -\cexample{SIMD}{3} +\cexample[4.0]{SIMD}{3} -\ffreeexample{SIMD}{3} +\ffreeexample[4.0]{SIMD}{3} \pagebreak @@ -68,9 +68,9 @@ code is safe for vectors up to and including size 16. In the loop, \plc{m} can be 16 or greater, for correct code execution. If the value of \plc{m} is less than 16, the behavior is undefined. -\cexample{SIMD}{4} +\cexample[4.0]{SIMD}{4} -\ffreeexample{SIMD}{4} +\ffreeexample[4.0]{SIMD}{4} \pagebreak The following SIMD construct instructs the compiler to collapse the \plc{i} and @@ -78,9 +78,9 @@ The following SIMD construct instructs the compiler to collapse the \plc{i} and threads of the team. Within the workshared loop chunks of a thread, the SIMD chunks are executed in the lanes of the vector units. -\cexample{SIMD}{5} +\cexample[4.0]{SIMD}{5} -\ffreeexample{SIMD}{5} +\ffreeexample[4.0]{SIMD}{5} %%% section @@ -95,9 +95,9 @@ the other hand, the \code{inbranch} clause for the function goo indicates that the function is always called conditionally in the SIMD loop inside the function \plc{myaddfloat}. -\cexample{SIMD}{6} +\cexample[4.0]{SIMD}{6} -\ffreeexample{SIMD}{6} +\ffreeexample[4.0]{SIMD}{6} In the code below, the function \plc{fib()} is called in the main program and @@ -106,9 +106,9 @@ condition. The compiler creates a masked vector version and a non-masked vector version for the function \plc{fib()} while retaining the original scalar version of the \plc{fib()} function. -\cexample{SIMD}{7} +\cexample[4.0]{SIMD}{7} -\ffreeexample{SIMD}{7} +\ffreeexample[4.0]{SIMD}{7} @@ -124,7 +124,7 @@ A loop can be vectorized even though the iterations are not completely independe This test assures that the compiler preserves the loop carried lexical forward-dependence for generating a correct SIMD code. -\cexample{SIMD}{8} +\cexample[4.0]{SIMD}{8} -\ffreeexample{SIMD}{8} +\ffreeexample[4.0]{SIMD}{8} diff --git a/Examples_acquire_release.tex b/Examples_acquire_release.tex index 5205277..3f91622 100644 --- a/Examples_acquire_release.tex +++ b/Examples_acquire_release.tex @@ -67,8 +67,8 @@ by thread 0 and the read from \plc{x} by thread 1, and so thread 1 must see that \plc{x} equals 10. \pagebreak -\cexample{acquire_release}{1} -\ffreeexample{acquire_release}{1} +\cexample[5.0]{acquire_release}{1} +\ffreeexample[5.0]{acquire_release}{1} In the second example, the \code{critical} constructs are exchanged with \code{atomic} constructs that have \textit{explicit} memory ordering specified. When the @@ -77,8 +77,8 @@ results in a release/acquire synchronization that in turn implies that the assignment to \plc{x} on thread 0 happens before the read of \plc{x} on thread 1. Therefore, thread 1 will print ``x = 10''. -\cexample{acquire_release}{2} -\ffreeexample{acquire_release}{2} +\cexample[5.0]{acquire_release}{2} +\ffreeexample[5.0]{acquire_release}{2} \pagebreak In the third example, \code{atomic} constructs that specify relaxed atomic @@ -105,8 +105,8 @@ construct used in Example 2 for thread 1. %} %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%3 -\cexample{acquire_release}{3} -\ffreeexample{acquire_release}{3} +\cexample[5.0]{acquire_release}{3} +\ffreeexample[5.0]{acquire_release}{3} Example 4 will fail to order the write to \plc{x} on thread 0 before the read from \plc{x} on thread 1. Importantly, the implicit release flush on exit from @@ -137,5 +137,5 @@ modifies \plc{y} and provides release semantics must be specified. %by thread 0. %} -\cexample{acquire_release_broke}{4} -\ffreeexample{acquire_release_broke}{4} +\cexample[5.0]{acquire_release_broke}{4} +\ffreeexample[5.0]{acquire_release_broke}{4} diff --git a/Examples_affinity.tex b/Examples_affinity.tex index 76050e5..be0c94c 100644 --- a/Examples_affinity.tex +++ b/Examples_affinity.tex @@ -34,9 +34,9 @@ the partition list when the number of threads is less than or equal to the numbe of places in the parent's place partition, for the machine architecture depicted above. Note that the threads are bound to the first place of each subpartition. -\cexample{affinity}{1} +\cexample[4.0]{affinity}{1} -\fexample{affinity}{1} +\fexample[4.0]{affinity}{1} It is unspecified on which place the master thread is initially started. If the master thread is initially started on p0, the following placement of threads will @@ -75,9 +75,9 @@ parent's place partition. The first \plc{T/P} threads of the team (including the thread) execute on the parent's place. The next \plc{T/P} threads execute on the next place in the place partition, and so on, with wrap around. -\cexample{affinity}{2} +\cexample[4.0]{affinity}{2} -\ffreeexample{affinity}{2} +\ffreeexample[4.0]{affinity}{2} It is unspecified on which place the master thread is initially started. If the master thread is initially started on p0, the following placement of threads will @@ -130,9 +130,9 @@ the partition list when the number of threads is less than or equal to the numbe of places in parent's place partition, for the machine architecture depicted above. The place partition is not changed by the \code{close} policy. -\cexample{affinity}{3} +\cexample[4.0]{affinity}{3} -\fexample{affinity}{3} +\fexample[4.0]{affinity}{3} It is unspecified on which place the master thread is initially started. If the master thread is initially started on p0, the following placement of threads will @@ -171,9 +171,9 @@ thread) execute on the parent's place. The next \plc{T/P} threads execute on the place in the place partition, and so on, with wrap around. The place partition is not changed by the \code{close} policy. -\cexample{affinity}{4} +\cexample[4.0]{affinity}{4} -\ffreeexample{affinity}{4} +\ffreeexample[4.0]{affinity}{4} It is unspecified on which place the master thread is initially started. If the master thread is initially running on p0, the following placement of threads will @@ -225,9 +225,9 @@ The following example shows the result of the \code{master} affinity policy on the partition list for the machine architecture depicted above. The place partition is not changed by the master policy. -\cexample{affinity}{5} +\cexample[4.0]{affinity}{5} -\fexample{affinity}{5} +\fexample[4.0]{affinity}{5} It is unspecified on which place the master thread is initially started. If the master thread is initially running on p0, the following placement of threads will diff --git a/Examples_affinity_display.tex b/Examples_affinity_display.tex index 03f2f86..10aa0dc 100644 --- a/Examples_affinity_display.tex +++ b/Examples_affinity_display.tex @@ -28,9 +28,9 @@ not changed, so affinity is NOT reported. In the last parallel region, the thread affinities are reported because the thread affinity has changed. -\cexample{affinity_display}{1} +\cexample[5.0]{affinity_display}{1} -\ffreeexample{affinity_display}{1} +\ffreeexample[5.0]{affinity_display}{1} In the following example 2 threads are forked, and each executes on a socket. Next, @@ -58,9 +58,9 @@ the parallel nesting level (\%L), the ancestor thread number (\%a), the thread n and the thread affinity (\%A). In the nested parallel region within the \plc{socket\_work} routine the affinities for the threads on each socket are printed according to this format. -\cexample{affinity_display}{2} +\cexample[5.0]{affinity_display}{2} -\ffreeexample{affinity_display}{2} +\ffreeexample[5.0]{affinity_display}{2} The next example illustrates more details about affinity formatting. First, the \code{omp\_get\_affininity\_format()} API routine is used to @@ -98,7 +98,7 @@ The maximum value for the number of characters (\plc{nchars}) returned by clause and the \plc{if(nchars >= max\_req\_store) max\_req\_store=nchars} statement. It is used to report possible truncation (if \plc{max\_req\_store} > \plc{buffer\_store}). -\cexample{affinity_display}{3} +\cexample[5.0]{affinity_display}{3} -\ffreeexample{affinity_display}{3} +\ffreeexample[5.0]{affinity_display}{3} diff --git a/Examples_affinity_query.tex b/Examples_affinity_query.tex index 1630aaf..2cd0d57 100644 --- a/Examples_affinity_query.tex +++ b/Examples_affinity_query.tex @@ -37,7 +37,7 @@ On some systems there are utilities, files or user guides that provide configura information. For instance, the socket number and proc\_id's for a socket can be found in the /proc/cpuinfo text file on Linux systems. -\cexample{affinity_query}{1} +\cexample[4.5]{affinity_query}{1} -\ffreeexample{affinity_query}{1} +\ffreeexample[4.5]{affinity_query}{1} diff --git a/Examples_allocators.tex b/Examples_allocators.tex index a51f439..d3e473b 100644 --- a/Examples_allocators.tex +++ b/Examples_allocators.tex @@ -57,7 +57,7 @@ and the set of all variables used in the allocate statement is specified in the %\pagebreak - \cexample{allocators}{1} -\ffreeexample{allocators}{1} +\cexample[5.0]{allocators}{1} +\ffreeexample[5.0]{allocators}{1} diff --git a/Examples_array_sections.tex b/Examples_array_sections.tex index c970780..648c4d2 100644 --- a/Examples_array_sections.tex +++ b/Examples_array_sections.tex @@ -8,31 +8,31 @@ on \code{target} and \code{target} \code{data} constructs. This example shows the invalid usage of two separate sections of the same array inside of a \code{target} construct. -\cexample{array_sections}{1} +\cexample[4.0]{array_sections}{1} -\ffreeexample{array_sections}{1} +\ffreeexample[4.0]{array_sections}{1} \pagebreak This example shows the invalid usage of two separate sections of the same array inside of a \code{target} construct. -\cexample{array_sections}{2} +\cexample[4.0]{array_sections}{2} -\ffreeexample{array_sections}{2} +\ffreeexample[4.0]{array_sections}{2} \pagebreak This example shows the valid usage of two separate sections of the same array inside of a \code{target} construct. -\cexample{array_sections}{3} +\cexample[4.0]{array_sections}{3} -\ffreeexample{array_sections}{3} +\ffreeexample[4.0]{array_sections}{3} \pagebreak This example shows the valid usage of a wholly contained array section of an already mapped array section inside of a \code{target} construct. -\cexample{array_sections}{4} +\cexample[4.0]{array_sections}{4} -\ffreeexample{array_sections}{4} +\ffreeexample[4.0]{array_sections}{4} diff --git a/Examples_array_shaping.tex b/Examples_array_shaping.tex index b2697b9..75d6bae 100644 --- a/Examples_array_shaping.tex +++ b/Examples_array_shaping.tex @@ -23,5 +23,13 @@ Note the use of additional parentheses around the shape-operator and $a$ to ensure the correct precedence over array-section operations. -\cnexample{array_shaping}{1} +\cnexample[5.0]{array_shaping}{1} \ccppspecificend + +The shape operator is not defined for Fortran. Explicit array shaping +of procedure arguments can be used instead to achieve a similar goal. +Below is the Fortran-equivalent of the above example that illustrates +the support of transferring two rows of noncontiguous boundary +data in the \code{target}~\code{update} directive. + +\ffreeexample[5.0]{array_shaping}{1} diff --git a/Examples_associate.tex b/Examples_associate.tex index 4e8f5a2..5d7899c 100644 --- a/Examples_associate.tex +++ b/Examples_associate.tex @@ -11,13 +11,13 @@ name \plc{b} is associated with the shared variable \plc{a}. With the predetermi attribute rule, the associate name \plc{b} is not allowed to be specified on the \code{private} clause. -\fnexample{associate}{1} +\fnexample[4.0]{associate}{1} In next example, within the \code{parallel} construct, the association name \plc{thread\_id} is associated with the private copy of \plc{i}. The print statement should output the unique thread number. -\fnexample{associate}{2} +\fnexample[4.0]{associate}{2} The following example illustrates the effect of specifying a selector name on a data-sharing attribute clause. The associate name \plc{u} is associated with \plc{v} and the variable \plc{v} @@ -27,6 +27,6 @@ The association between \plc{u} and the original \plc{v} is retained (see the Da Attribute Rules section in the OpenMP 4.0 API Specifications). Inside the \code{parallel} region, \plc{v} has the value of -1 and \plc{u} has the value of the original \plc{v}. -\ffreenexample{associate}{3} +\ffreenexample[4.0]{associate}{3} \fortranspecificend diff --git a/Examples_async_target_nowait.tex b/Examples_async_target_nowait.tex index 087af00..b88fb4b 100644 --- a/Examples_async_target_nowait.tex +++ b/Examples_async_target_nowait.tex @@ -26,6 +26,6 @@ one thread is being used for offload generation. In the situation where little time is spent by the \plc{target task} in setting up and tearing down the the target execution, \code{static} scheduling may be desired. -\cexample{async_target}{3} +\cexample[4.5]{async_target}{3} -\ffreeexample{async_target}{3} +\ffreeexample[4.5]{async_target}{3} diff --git a/Examples_async_target_nowait_depend.tex b/Examples_async_target_nowait_depend.tex index 1cf260d..11dc6e5 100644 --- a/Examples_async_target_nowait_depend.tex +++ b/Examples_async_target_nowait_depend.tex @@ -11,8 +11,8 @@ The last dependence is produced by array \plc{p} with the \code{out} dependence The \code{nowait} clause on the \code{target} construct creates a deferrable \plc{target task}, allowing the encountering task to continue execution without waiting for the completion of the \plc{target task}. -\cexample{async_target}{4} +\cexample[4.5]{async_target}{4} -\ffreeexample{async_target}{4} +\ffreeexample[4.5]{async_target}{4} %end diff --git a/Examples_async_target_with_tasks.tex b/Examples_async_target_with_tasks.tex index 09bf78c..7df03b1 100644 --- a/Examples_async_target_with_tasks.tex +++ b/Examples_async_target_with_tasks.tex @@ -9,20 +9,20 @@ scheduling point while waiting for the execution of the \code{target} region to complete, allowing the thread to switch back to the execution of the encountering task or one of the previously generated explicit tasks. -\cexample{async_target}{1} +\cexample[4.0]{async_target}{1} \pagebreak The Fortran version has an interface block that contains the \code{declare} \code{target}. An identical statement exists in the function declaration (not shown here). -\ffreeexample{async_target}{1} +\ffreeexample[4.0]{async_target}{1} The following example shows how the \code{task} and \code{target} constructs are used to execute multiple \code{target} regions asynchronously. The task dependence ensures that the storage is allocated and initialized on the device before it is accessed. -\cexample{async_target}{2} +\cexample[4.0]{async_target}{2} The Fortran example below is similar to the C version above. Instead of pointers, though, it uses the convenience of Fortran allocatable arrays on the device. In order to preserve the arrays @@ -52,4 +52,4 @@ section of the specification.) However, the intention is to relax the restrictions on mapping of allocatable variables in the next release of the specification so that the example will be compliant. -\ffreeexample{async_target}{2} +\ffreeexample[4.0]{async_target}{2} diff --git a/Examples_atomic.tex b/Examples_atomic.tex index 06f280c..620c53e 100644 --- a/Examples_atomic.tex +++ b/Examples_atomic.tex @@ -14,9 +14,9 @@ Note that the \code{atomic} directive applies only to the statement immediately following it. As a result, elements of \plc{y} are not updated atomically in this example. -\cexample{atomic}{1} +\cexample[3.1]{atomic}{1} -\fexample{atomic}{1} +\fexample[3.1]{atomic}{1} The following example illustrates the \code{read} and \code{write} clauses for the \code{atomic} directive. These clauses ensure that the given variable @@ -26,9 +26,9 @@ another part of the variable. Note that most hardware provides atomic reads and writes for some set of properly aligned variables of specific sizes, but not necessarily for all the variable types supported by the OpenMP API. -\cexample{atomic}{2} +\cexample[3.1]{atomic}{2} -\fexample{atomic}{2} +\fexample[3.1]{atomic}{2} The following example illustrates the \code{capture} clause for the \code{atomic} directive. In this case the value of a variable is captured, and then the variable @@ -37,8 +37,8 @@ be implemented using the fetch-and-add instruction available on many kinds of ha The example also shows a way to implement a spin lock using the \code{capture} and \code{read} clauses. -\cexample{atomic}{3} +\cexample[3.1]{atomic}{3} -\fexample{atomic}{3} +\fexample[3.1]{atomic}{3} diff --git a/Examples_atomic_restrict.tex b/Examples_atomic_restrict.tex index 9599e05..93080da 100644 --- a/Examples_atomic_restrict.tex +++ b/Examples_atomic_restrict.tex @@ -5,21 +5,21 @@ The following non-conforming examples illustrate the restrictions on the \code{atomic} construct. -\cexample{atomic_restrict}{1} +\cexample[3.1]{atomic_restrict}{1} -\fexample{atomic_restrict}{1} +\fexample[3.1]{atomic_restrict}{1} -\cexample{atomic_restrict}{2} +\cexample[3.1]{atomic_restrict}{2} \fortranspecificstart The following example is non-conforming because \code{I} and \code{R} reference the same location but have different types. -\fnexample{atomic_restrict}{2} +\fnexample[3.1]{atomic_restrict}{2} Although the following example might work on some implementations, this is also non-conforming: -\fnexample{atomic_restrict}{3} +\fnexample[3.1]{atomic_restrict}{3} \fortranspecificend diff --git a/Examples_cancellation.tex b/Examples_cancellation.tex index 05d41b6..7ebcd60 100644 --- a/Examples_cancellation.tex +++ b/Examples_cancellation.tex @@ -11,7 +11,7 @@ exception is properly handled in the sequential part. If cancellation of the \co region has been requested, some threads might have executed \code{phase\_1()}. However, it is guaranteed that none of the threads executed \code{phase\_2()}. -\cppexample{cancellation}{1} +\cppexample[4.0]{cancellation}{1} The following example illustrates the use of the \code{cancel} construct in error @@ -20,7 +20,7 @@ the cancellation is activated. The encountering thread sets the shared variable \code{err} and other threads of the binding thread set proceed to the end of the worksharing construct after the cancellation has been activated. -\ffreeexample{cancellation}{1} +\ffreeexample[4.0]{cancellation}{1} \clearpage @@ -34,11 +34,11 @@ task group to control the effect of the \code{cancel taskgroup} directive. The \plc{level} argument is used to create undeferred tasks after the first ten levels of the tree. -\cexample{cancellation}{2} +\cexample[4.0]{cancellation}{2} The following is the equivalent parallel search example in Fortran. -\ffreeexample{cancellation}{2} +\ffreeexample[4.0]{cancellation}{2} diff --git a/Examples_collapse.tex b/Examples_collapse.tex index 4a59066..6986ae4 100644 --- a/Examples_collapse.tex +++ b/Examples_collapse.tex @@ -16,9 +16,9 @@ The variable \code{j} can be omitted from the \code{private} clause when the from the \code{private} clause. In either case, \code{k} is implicitly private and could be omitted from the \code{private} clause. -\cexample{collapse}{1} +\cexample[3.0]{collapse}{1} -\fexample{collapse}{1} +\fexample[3.0]{collapse}{1} In the next example, the \code{k} and \code{j} loops are associated with the loop construct. So the iterations of the \code{k} and \code{j} loops are collapsed @@ -33,9 +33,9 @@ will have the value \code{2} and \code{j} will have the value \code{3}. Since by the sequentially last iteration of the collapsed \code{k} and \code{j} loop. This example prints: \code{2 3}. -\cexample{collapse}{2} +\cexample[3.0]{collapse}{2} -\fexample{collapse}{2} +\fexample[3.0]{collapse}{2} The next example illustrates the interaction of the \code{collapse} and \code{ordered} clauses. @@ -71,8 +71,8 @@ The code prints \\ \code{1 3 2} -\cexample{collapse}{3} +\cexample[3.0]{collapse}{3} -\fexample{collapse}{3} +\fexample[3.0]{collapse}{3} diff --git a/Examples_cpp_reference.tex b/Examples_cpp_reference.tex index 2ff2ce8..89f04d8 100644 --- a/Examples_cpp_reference.tex +++ b/Examples_cpp_reference.tex @@ -10,5 +10,5 @@ The following example shows the use of reference types in data-sharing clauses i Additionally it shows how the data-sharing of formal arguments with a C++ reference type on an orphaned task generating construct is determined implicitly. (See the Data-sharing Attribute Rules for Variables Referenced in a Construct Section of the 4.5 OpenMP specification.) -\cppnexample{cpp_reference}{1} +\cppnexample[4.5]{cpp_reference}{1} \cppspecificend diff --git a/Examples_critical.tex b/Examples_critical.tex index c2ed0ea..f897e90 100644 --- a/Examples_critical.tex +++ b/Examples_critical.tex @@ -17,4 +17,4 @@ The following example extends the previous example by adding the \code{hint} cla \cexample{critical}{2} -\fexample{critical}{2} +\fexample[4.5]{critical}{2} diff --git a/Examples_declare_target.tex b/Examples_declare_target.tex index e24d214..2b022dc 100644 --- a/Examples_declare_target.tex +++ b/Examples_declare_target.tex @@ -16,7 +16,7 @@ the \code{target} region (thus \code{fib}) will execute on the host device. For C/C++ codes the declaration of the function \code{fib} appears between the \code{declare} \code{target} and \code{end} \code{declare} \code{target} directives. -\cexample{declare_target}{1} +\cexample[4.0]{declare_target}{1} The Fortran \code{fib} subroutine contains a \code{declare} \code{target} declaration to indicate to the compiler to create an device executable version of the procedure. @@ -27,7 +27,7 @@ The program uses the \code{module\_fib} module, which presents an explicit inter the compiler with the \code{declare} \code{target} declarations for processing the \code{fib} call. -\ffreeexample{declare_target}{1} +\ffreeexample[4.0]{declare_target}{1} The next Fortran example shows the use of an external subroutine. Without an explicit interface (through module use or an interface block) the \code{declare} \code{target} @@ -35,7 +35,7 @@ declarations within a external subroutine are unknown to the main program unit; therefore, a \code{declare} \code{target} must be provided within the program scope for the compiler to determine that a target binary should be available. -\ffreeexample{declare_target}{2} +\ffreeexample[4.0]{declare_target}{2} \subsection{\code{declare} \code{target} Construct for Class Type} \label{subsec:declare_target_class} @@ -47,7 +47,7 @@ of a variable \plc{varY} with a class type \code{typeY}. The member function \co be accessed on a target device because its declaration did not appear between \code{declare} \code{target} and \code{end} \code{declare} \code{target} directives. -\cppnexample{declare_target}{2} +\cppnexample[4.0]{declare_target}{2} \cppspecificend \subsection{\code{declare} \code{target} and \code{end} \code{declare} \code{target} for Variables} @@ -65,13 +65,13 @@ is then used to manage the consistency of the variables \plc{p}, \plc{v1}, and \ data environment of the encountering host device task and the implicit device data environment of the default target device. -\cexample{declare_target}{3} +\cexample[4.0]{declare_target}{3} The Fortran version of the above C code uses a different syntax. Fortran modules use a list syntax on the \code{declare} \code{target} directive to declare mapped variables. -\ffreeexample{declare_target}{3} +\ffreeexample[4.0]{declare_target}{3} The following example also indicates that the function \code{Pfun()} is available on the target device, as well as the variable \plc{Q}, which is mapped to the implicit device @@ -84,7 +84,7 @@ In the following example, the function and variable declarations appear between the \code{declare} \code{target} and \code{end} \code{declare} \code{target} directives. -\cexample{declare_target}{4} +\cexample[4.0]{declare_target}{4} The Fortran version of the above C code uses a different syntax. In Fortran modules a list syntax on the \code{declare} \code{target} directive is used to declare @@ -93,7 +93,7 @@ separated list. When the \code{declare} \code{target} directive is used to declare just the procedure, the procedure name need not be listed -- it is implicitly assumed, as illustrated in the \code{Pfun()} function. -\ffreeexample{declare_target}{4} +\ffreeexample[4.0]{declare_target}{4} \subsection{\code{declare} \code{target} and \code{end} \code{declare} \code{target} with \code{declare} \code{simd}} \label{subsec:declare_target_simd} @@ -104,7 +104,7 @@ is available on a target device. The \code{declare} \code{simd} directive indica that there is a SIMD version of the function \code{P()} that is available on the target device as well as one that is available on the host device. -\cexample{declare_target}{5} +\cexample[4.0]{declare_target}{5} The Fortran version of the above C code uses a different syntax. Fortran modules use a list syntax of the \code{declare} \code{target} declaration for the mapping. @@ -113,7 +113,7 @@ The function declaration does not use a list and implicitly assumes the function name. In this Fortran example row and column indices are reversed relative to the C/C++ example, as is usual for codes optimized for memory access. -\ffreeexample{declare_target}{5} +\ffreeexample[4.0]{declare_target}{5} \subsection{\code{declare}~\code{target} Directive with \code{link} Clause} @@ -137,6 +137,6 @@ globally on the device for part of the program execution. The single precision d are allocated and persist only for the first \code{target} region. Similarly, the double precision data are in scope on the device only for the second \code{target} region. -\cexample{declare_target}{6} -\ffreeexample{declare_target}{6} +\cexample[4.5]{declare_target}{6} +\ffreeexample[4.5]{declare_target}{6} diff --git a/Examples_depobj.tex b/Examples_depobj.tex index 2355138..9ca962b 100644 --- a/Examples_depobj.tex +++ b/Examples_depobj.tex @@ -44,6 +44,6 @@ effectively destroying the depend object. After an object has been uninitialized it can be initialized again with a new dependence type \emph{and} a new variable. -\cexample{depobj}{1} +\cexample[5.0]{depobj}{1} -\ffreeexample{depobj}{1} +\ffreeexample[5.0]{depobj}{1} diff --git a/Examples_device.tex b/Examples_device.tex index 0dd1a87..202688c 100644 --- a/Examples_device.tex +++ b/Examples_device.tex @@ -10,9 +10,9 @@ can be used to query if a code is executing on the initial host device or on a target device. The example then sets the number of threads in the \code{parallel} region based on where the code is executing. -\cexample{device}{1} +\cexample[4.0]{device}{1} -\ffreeexample{device}{1} +\ffreeexample[4.0]{device}{1} \subsection{\code{omp\_get\_num\_devices} Routine} \label{subsec:device_num_devices} @@ -20,9 +20,9 @@ region based on where the code is executing. The following example shows how the \code{omp\_get\_num\_devices} runtime library routine can be used to determine the number of devices. -\cexample{device}{2} +\cexample[4.0]{device}{2} -\ffreeexample{device}{2} +\ffreeexample[4.0]{device}{2} \subsection{\code{omp\_set\_default\_device} and \\ \code{omp\_get\_default\_device} Routines} @@ -32,9 +32,9 @@ The following example shows how the \code{omp\_set\_default\_device} and \code{o runtime library routines can be used to set the default device and determine the default device respectively. -\cexample{device}{3} +\cexample[4.0]{device}{3} -\ffreeexample{device}{3} +\ffreeexample[4.0]{device}{3} \subsection{Target Memory and Device Pointers Routines} @@ -53,5 +53,5 @@ in a \code{target} region by exposing the device pointer in an \code{is\_device\ The example creates an array of cosine values on the default device, to be used on the host device. The function fails if a default device is not available. -\cexample{device}{4} +\cexample[4.5]{device}{4} diff --git a/Examples_doacross.tex b/Examples_doacross.tex index a23ebab..30925b1 100644 --- a/Examples_doacross.tex +++ b/Examples_doacross.tex @@ -19,9 +19,9 @@ with an \code{ordered} clause without a parameter, on the loop directive, and a single \code{ordered} directive without the \code{depend} clause specified for the statement executing the \plc{bar} function. -\cexample{doacross}{1} +\cexample[4.5]{doacross}{1} -\ffreeexample{doacross}{1} +\ffreeexample[4.5]{doacross}{1} The following code is similar to the previous example but with \plc{doacross loop nest} extended to two nested loops, \plc{i} and \plc{j}, @@ -37,9 +37,9 @@ Likewise, the \code{depend(sink:j-1,i)} and \code{depend(sink:j,i-1)} clauses in the Fortran code define cross-iteration dependences from iterations (\plc{j-1, i}) and (\plc{j, i-1}) to iteration (\plc{j, i}). -\cexample{doacross}{2} +\cexample[4.5]{doacross}{2} -\ffreeexample{doacross}{2} +\ffreeexample[4.5]{doacross}{2} The following example shows the incorrect use of the \code{ordered} @@ -51,9 +51,9 @@ clauses define dependences on lexicographically later source iterations (\plc{i+1, j}) and (\plc{i, j+1}), which could cause a deadlock as well since they may not start to execute until the current iteration completes. -\cexample{doacross}{3} +\cexample[4.5]{doacross}{3} -\ffreeexample{doacross}{3} +\ffreeexample[4.5]{doacross}{3} The following example illustrates the use of the \code{collapse} clause for @@ -63,6 +63,6 @@ The example also shows a compliant usage of the dependence source directive placed before the corresponding sink directive. Checking the completion of computation from previous iterations at the sink point can occur after the source statement. -\cexample{doacross}{4} +\cexample[4.5]{doacross}{4} -\ffreeexample{doacross}{4} +\ffreeexample[4.5]{doacross}{4} diff --git a/Examples_host_teams.tex b/Examples_host_teams.tex index a1c436d..6ff9a4f 100644 --- a/Examples_host_teams.tex +++ b/Examples_host_teams.tex @@ -22,7 +22,7 @@ to execute double precision code. Two teams are required, and the thread limit for each team is set to 1/2 of the number of available processors. -\cexample{host_teams}{1} +\cexample[5.0]{host_teams}{1} -\ffreeexample{host_teams}{1} +\ffreeexample[5.0]{host_teams}{1} diff --git a/Examples_init_lock_with_hint.tex b/Examples_init_lock_with_hint.tex index 8109eaa..8541f6e 100644 --- a/Examples_init_lock_with_hint.tex +++ b/Examples_init_lock_with_hint.tex @@ -5,6 +5,6 @@ The following example demonstrates how to initialize an array of locks in a \code{parallel} region by using \code{omp\_init\_lock\_with\_hint}. Note, hints are combined with an \code{|} or \code{+} operator in C/C++ and a \code{+} operator in Fortran. -\cppexample{init_lock_with_hint}{1} +\cppexample[4.5]{init_lock_with_hint}{1} -\fexample{init_lock_with_hint}{1} +\fexample[4.5]{init_lock_with_hint}{1} diff --git a/Examples_lastprivate.tex b/Examples_lastprivate.tex index f4e772e..d2cbd98 100644 --- a/Examples_lastprivate.tex +++ b/Examples_lastprivate.tex @@ -11,4 +11,14 @@ sequentially. \fexample{lastprivate}{1} +\clearpage +The next example illustrates the use of the \code{conditional} modifier in +a \code{lastprivate} clause to return the last value when it may not come from +the last iteration of a loop. +That is, users can preserve the serial equivalence semantics of the loop. +The conditional lastprivate ensures the final value of the variable after the loop +is as if the loop iterations were executed in a sequential order. +\cexample[5.0]{lastprivate}{2} + +\ffreeexample[5.0]{lastprivate}{2} diff --git a/Examples_linear_in_loop.tex b/Examples_linear_in_loop.tex index 3ef1ad7..17d79f6 100644 --- a/Examples_linear_in_loop.tex +++ b/Examples_linear_in_loop.tex @@ -7,7 +7,7 @@ an induction variable (\plc{j}). At the end of the execution of the loop construct, the original variable \plc{j} is updated with the value \plc{N/2} from the last iteration of the loop. -\cexample{linear_in_loop}{1} +\cexample[4.5]{linear_in_loop}{1} -\ffreeexample{linear_in_loop}{1} +\ffreeexample[4.5]{linear_in_loop}{1} diff --git a/Examples_linear_modifier.tex b/Examples_linear_modifier.tex new file mode 100644 index 0000000..c9c1af3 --- /dev/null +++ b/Examples_linear_modifier.tex @@ -0,0 +1,76 @@ +%%% section +\section{\code{ref}, \code{val}, \code{uval} Modifiers for \code{linear} Clause} +\label{sec:linear_modifier} + +When generating vector functions from \code{declare}~\code{simd} directives, it is important for a compiler to know the proper types of function arguments in +order to generate efficient codes. +This is especially true for C++ reference types and Fortran arguments. + +In the following example, the function \plc{add\_one2} has a C++ reference +parameter (or Fortran argument) \plc{p}. Variable \plc{p} gets incremented by 1 in the function. +The caller loop \plc{i} in the main program passes +a variable \plc{k} as a reference to the function \plc{add\_one2} call. +The \code{ref} modifier for the \code{linear} clause on the +\code{declare}~\code{simd} directive is used to annotate the +reference-type parameter \plc{p} to match the property of the variable +\plc{k} in the loop. +This use of reference type is equivalent to the second call to +\plc{add\_one2} with a direct passing of the array element \plc{a[i]}. +In the example, the preferred vector +length 8 is specified for both the caller loop and the callee function. + +When \code{linear(ref(p))} is applied to an argument passed by reference, +it tells the compiler that the addresses in its vector argument are consecutive, +and so the compiler can generate a single vector load or store instead of +a gather or scatter. This allows more efficient SIMD code to be generated with +less source changes. + +\cppexample[4.5]{linear_modifier}{1} +\ffreeexample[4.5]{linear_modifier}{1} +\clearpage + + +The following example is a variant of the above example. The function \plc{add\_one2} in the C++ code includes an additional C++ reference parameter \plc{i}. +The loop index \plc{i} of the caller loop \plc{i} in the main program +is passed as a reference to the function \plc{add\_one2} call. +The loop index \plc{i} has a uniform address with +linear value of step 1 across SIMD lanes. +Thus, the \code{uval} modifier is used for the \code{linear} clause +to annotate the C++ reference-type parameter \plc{i} to match +the property of loop index \plc{i}. + +In the correponding Fortran code the arguments \plc{p} and +\plc{i} in the routine \plc{add\_on2} are passed by references. +Similar modifiers are used for these variables in the \code{linear} clauses +to match with the property at the caller loop in the main program. + +When \code{linear(uval(i))} is applied to an argument passed by reference, it +tells the compiler that its addresses in the vector argument are uniform +so that the compiler can generate a scalar load or scalar store and create +linear values. This allows more efficient SIMD code to be generated with +less source changes. + +\cppexample[4.5]{linear_modifier}{2} +\ffreeexample[4.5]{linear_modifier}{2} + +In the following example, the function \plc{func} takes arrays \plc{x} and \plc{y} as arguments, and accesses the array elements referenced by +the index \plc{i}. +The caller loop \plc{i} in the main program passes a linear copy of +the variable \plc{k} to the function \plc{func}. +The \code{val} modifier is used for the \code{linear} clause +in the \code{declare}~\code{simd} directive for the function +\plc{func} to annotate argument \plc{i} to match the property of +the actual argument \plc{k} passed in the SIMD loop. +Arrays \plc{x} and \plc{y} have uniform addresses across SIMD lanes. + +When \code{linear(val(i):1)} is applied to an argument, +it tells the compiler that its addresses in the vector argument may not be +consecutive, however, their values are linear (with stride 1 here). When the value of \plc{i} is used +in subscript of array references (e.g., \plc{x[i]}), the compiler can generate +a vector load or store instead of a gather or scatter. This allows more +efficient SIMD code to be generated with less source changes. + +\cexample[4.5]{linear_modifier}{3} +\ffreeexample[4.5]{linear_modifier}{3} + + diff --git a/Examples_loop.tex b/Examples_loop.tex index ff94c7e..2c99180 100644 --- a/Examples_loop.tex +++ b/Examples_loop.tex @@ -9,5 +9,5 @@ of the loop are free of data dependencies and may be executed concurrently. It allows the compiler to use heuristics to select the parallelization scheme and compiler-level optimizations for the concurrency. - \cexample{loop}{1} -\ffreeexample{loop}{1} +\cexample[5.0]{loop}{1} +\ffreeexample[5.0]{loop}{1} diff --git a/Examples_mem_model.tex b/Examples_mem_model.tex index 7089570..1f58fb2 100644 --- a/Examples_mem_model.tex +++ b/Examples_mem_model.tex @@ -3,39 +3,52 @@ \section{The OpenMP Memory Model} \label{sec:mem_model} -In the following example, at Print 1, the value of \plc{x} could be either 2 -or 5, depending on the timing of the threads, and the implementation of the assignment -to \plc{x}. There are two reasons that the value at Print 1 might not be 5. -First, Print 1 might be executed before the assignment to \plc{x} is executed. -Second, even if Print 1 is executed after the assignment, the value 5 is not guaranteed -to be seen by thread 1 because a flush may not have been executed by thread 0 since -the assignment. +The following examples illustrate two major concerns for concurrent thread +execution: ordering of thread execution and memory accesses that may or may not +lead to race conditions. -The barrier after Print 1 contains implicit flushes on all threads, as well as -a thread synchronization, so the programmer is guaranteed that the value 5 will -be printed by both Print 2 and Print 3. +In the following example, at Print 1, the value of \code{xval} could be either 2 +or 5, depending on the timing of the threads. The \code{atomic} directives are +necessary for the accesses to \code{x} by threads 1 and 2 to avoid a data race. +If the atomic write completes before the atomic read, thread 1 is guaranteed to +see 5 in \code{xval}. Otherwise, thread 1 is guaranteed to see 2 in \code{xval}. -\cexample{mem_model}{1} +The barrier after Print 1 contains implicit flushes on all threads, as well as +a thread synchronization, so the programmer is guaranteed that the value 5 will +be printed by both Print 2 and Print 3. Since neither Print 2 or Print 3 are modifying +\code{x}, they may concurrently access \code{x} without requiring \code{atomic} +directives to avoid a data race. -\ffreeexample{mem_model}{1} +\cexample[3.1]{mem_model}{1} + +\ffreeexample[3.1]{mem_model}{1} \pagebreak -The following example demonstrates why synchronization is difficult to perform -correctly through variables. The value of flag is undefined in both prints on thread -1 and the value of data is only well-defined in the second print. +The following example demonstrates why synchronization is difficult to perform +correctly through variables. The write to \code{flag} on thread 0 and the read +from \code{flag} in the loop on thread 1 must be atomic to avoid a data race. +When thread 1 breaks out of the loop, \code{flag} will have the value of 1. +However, \code{data} will still be undefined at the first print statement. Only +after the flush of both \code{flag} and \code{data} after the first print +statement will \code{data} have the well-defined value of 42. -\cexample{mem_model}{2} +\cexample[3.1]{mem_model}{2} -\fexample{mem_model}{2} +\fexample[3.1]{mem_model}{2} \pagebreak -The next example demonstrates why synchronization is difficult to perform correctly -through variables. Because the \plc{write}(1)-\plc{flush}(1)-\plc{flush}(2)-\plc{read}(2) -sequence cannot be guaranteed in the example, the statements on thread 0 and thread -1 may execute in either order. +The next example demonstrates why synchronization is difficult to perform +correctly through variables. As in the preceding example, the updates to +\code{flag} and the reading of \code{flag} in the loops on threads 1 and 2 are +performed atomically to avoid data races on \code{flag}. However, the code still +contains data race due to the incorrect use of ``flush with a list'' after the +assignment to \code{data1} on thread 1. By not including \code{flag} in the +flush-set of that \code{flush} directive, the assignment can be reordered with +respect to the subsequent atomic update to \code{flag}. Consequentially, +\code{data1} is undefined at the print statement on thread 2. -\cexample{mem_model}{3} +\cexample[3.1]{mem_model}{3} -\fexample{mem_model}{3} +\fexample[3.1]{mem_model}{3} diff --git a/Examples_metadirective.tex b/Examples_metadirective.tex index ef2fa88..a3c1340 100644 --- a/Examples_metadirective.tex +++ b/Examples_metadirective.tex @@ -28,9 +28,9 @@ directive as selector set, has traits of \plc{kind}, \plc{isa} and \plc{arch}. -\cexample{metadirective}{1} +\cexample[5.0]{metadirective}{1} -\ffreeexample{metadirective}{1} +\ffreeexample[5.0]{metadirective}{1} %\pagebreak In the second example, the \plc{implementation} selector set is specified @@ -47,9 +47,9 @@ traits. Otherwise, just the \code{teams} construct is used without any clauses, as prescribed by the \code{default} clause. -\cexample{metadirective}{2} +\cexample[5.0]{metadirective}{2} -\ffreeexample{metadirective}{2} +\ffreeexample[5.0]{metadirective}{2} \clearpage @@ -83,6 +83,6 @@ the \code{target}~\code{teams} construct has been hoisted out of the function, a as the \plc{variant} directive of the \code{metadirective} directive within the function. %%%%%%%% -\cexample{metadirective}{3} +\cexample[5.0]{metadirective}{3} -\ffreeexample{metadirective}{3} +\ffreeexample[5.0]{metadirective}{3} diff --git a/Examples_parallel_master_taskloop.tex b/Examples_parallel_master_taskloop.tex index c2474cb..d88ead4 100644 --- a/Examples_parallel_master_taskloop.tex +++ b/Examples_parallel_master_taskloop.tex @@ -28,6 +28,6 @@ with appropriate restrictions. The combination of the \code{parallel}~\code{mast with the \code{taskloop} or \code{taskloop}~\code{simd} construct produces no additional restrictions. -\cexample{parallel_master_taskloop}{1} +\cexample[5.0]{parallel_master_taskloop}{1} -\ffreeexample{parallel_master_taskloop}{1} +\ffreeexample[5.0]{parallel_master_taskloop}{1} diff --git a/Examples_pra_iterator.tex b/Examples_pra_iterator.tex index 8008c49..1595a53 100644 --- a/Examples_pra_iterator.tex +++ b/Examples_pra_iterator.tex @@ -5,7 +5,7 @@ The following example shows a parallel random access iterator loop. -\cppnexample{pra_iterator}{1} +\cppnexample[3.0]{pra_iterator}{1} \cppspecificend diff --git a/Examples_reduction.tex b/Examples_reduction.tex index 4e326eb..02cb8b0 100644 --- a/Examples_reduction.tex +++ b/Examples_reduction.tex @@ -12,7 +12,7 @@ The following example demonstrates the \code{reduction} clause; note that some reductions can be expressed in the loop in several ways, as shown for the \code{max} and \code{min} reductions below: -\cexample{reduction}{1} +\cexample[3.1]{reduction}{1} \pagebreak @@ -66,38 +66,148 @@ the start of the \code{parallel} region. \fexample{reduction}{6} -The following example demonstrates the reduction of array \plc{a}. In C/C++ this is illustrated by the explicit use of an array section \plc{a[0:N]} in the \code{reduction} clause. The corresponding Fortran example uses array syntax supported in the base language. As of the OpenMP 4.5 specification the explicit use of array section in the \code{reduction} clause in Fortran is not permitted. But this oversight will be fixed in the next release of the specification. +The following example demonstrates the reduction of array \plc{a}. In C/C++ this is illustrated by the explicit use of an array section \plc{a[0:N]} in the \code{reduction} clause. The corresponding Fortran example uses array syntax supported in the base language. As of the OpenMP 4.5 specification the explicit use of array section in the \code{reduction} clause in Fortran is not permitted. But this oversight has been fixed in the OpenMP 5.0 specification. -\cexample{reduction}{7} +\cexample[4.5]{reduction}{7} \ffreeexample{reduction}{7} - \subsection{Task Reduction} \label{subsec:task_reduction} -The following C/C++ and Fortran examples show how to implement -a task reduction over a linked list. +In OpenMP 5.0 the \code{task\_reduction} clause was created for the \code{taskgroup} construct, +to allow reductions among explicit tasks that have an \code{in\_reduction} clause. -Task reductions are supported by the \code{task\_reduction} clause which can only be -applied to the \code{taskgroup} directive, and a \code{in\_reduction} clause -which can be applied to the \code{task} construct among others. - -The \code{task\_reduction} clause on the \code{taskgroup} construct is used to -define the scope of a new reduction, and after the \code{taskgroup} -region the original variable will contain the final value of the reduction. -In the task-generating while loop the \code{in\_reduction} clause of the \code{task} -construct is used to specify that the task participates "in" the reduction. +In the \plc{task\_reduction.1} example below a reduction is performed as the algorithm +traverses a linked list. The reduction statement is assigned to be an explicit task using +a \code{task} construct and is specified to be a reduction participant with +the \code{in\_reduction} clause. +A \code{taskgroup} construct encloses the tasks participating in the reduction, and +specifies, with the \code{task\_reduction} clause, that the taskgroup has tasks participating +in a reduction. After the \code{taskgroup} region the original variable will contain +the final value of the reduction. Note: The \plc{res} variable is private in the \plc{linked\_list\_sum} routine and is not required to be shared (as in the case of a \code{parallel} construct reduction). -\cexample{task_reduction}{1} +\cexample[5.0]{task_reduction}{1} -\ffreeexample{task_reduction}{1} +\ffreeexample[5.0]{task_reduction}{1} + +In OpenMP 5.0 the \code{task} \plc{reduction-modifier} for the \code{reduction} clause was +introduced to provide a means of performing reductions among implicit and explicit tasks. + +The \code{reduction} clause of a \code{parallel} or worksharing construct may +specify the \code{task} \plc{reduction-modifier} to include explicit task reductions +within their region, provided the reduction operators (\plc{reduction-identifiers}) +and variables (\plc{list items}) of the participating tasks match those of the +implicit tasks. + +There are 2 reduction use cases (identified by USE CASE \#) in the \plc{task\_reduction.2} example below. + +In USE CASE 1 a \code{task} modifier in the \code{reduction} clause +of the \code{parallel} construct is used to include the reductions of any +participating tasks, those with an \code{in\_reduction} clause and matching +\plc{reduction-identifiers} (\code{+}) and list items (\code{x}). + +Note, a \code{taskgroup} construct (with a \code{task\_reduction} clause) in not +necessary to scope the explicit task reduction (as seen in the example above). +Hence, even without the implicit task reduction statement (without the C \code{x++\;} +and Fortran \code{x=x+1} statements), the \code{task} \plc{reduction-modifier} +in a \code{reduction} clause of the \code{parallel} construct +can be used to avoid having to create a \code{taskgroup} construct +(and its \code{task\_reduction} clause) around the task generating structure. + +In USE CASE 2 tasks participating in the reduction are within a +worksharing region (a parallel worksharing-loop construct). +Here, too, no \code{taskgroup} is required, and the \plc{reduction-identifier} (\code{+}) +and list item (variable \code{x}) match as required. + + +\cexample[5.0]{task_reduction}{2} + +\ffreeexample[5.0]{task_reduction}{2} + + +\subsection{Reduction on Combined Target Constructs} +\label{subsec:target_reduction} + +When a \code{reduction} clause appears on a combined construct that combines +a \code{target} construct with another construct, there is an implicit map +of the list items with a \code{tofrom} map type for the \code{target} construct. +Otherwise, the list items (if they are scalar variables) would be +treated as firstprivate by default in the \code{target} construct, which +is unlikely to provide the intended behavior since the result of the +reduction that is in the firstprivate variable would be discarded +at the end of the \code{target} region. + +In the following example, the use of the \code{reduction} clause on \code{sum1} +or \code{sum2} should, by default, result in an implicit \code{tofrom} map for +that variable. So long as neither \code{sum1} nor \code{sum2} were already +present on the device, the mapping behavior ensures the value for +\code{sum1} computed in the first \code{target} construct is used in the +second \code{target} construct. + +\cexample[5.0]{target_reduction}{1} + +\ffreeexample[5.0]{target_reduction}{1} +\clearpage + +In next example, the variables \code{sum1} and \code{sum2} remain on the +device for the duration of the \code{target}~\code{data} region so that it is +their device copies that are updated by the reductions. Note the significance +of mapping \code{sum1} on the second \code{target} construct; otherwise, it +would be treated by default as firstprivate and the result computed for +\code{sum1} in the prior \code{target} region may not be used. Alternatively, a +\code{target}~\code{update} construct could be used between the two +\code{target} constructs to update the host version of \code{sum1} with the +value that is in the corresponding device version after the completion of the +first construct. + +\cexample[5.0]{target_reduction}{2} + +\ffreeexample[5.0]{target_reduction}{2} + + +\subsection{Task Reduction with Target Constructs} +\label{subsec:target_task_reduction} + +The following examples illustrate how task reductions can apply to target tasks +that result from a \code{target} construct with the \code{in\_reduction} +clause. Here, the \code{in\_reduction} clause specifies that the target task +participates in the task reduction defined in the scope of the enclosing +\code{taskgroup} construct. Partial results from all tasks participating in the +task reduction will be combined (in some order) into the original variable +listed in the \code{task\_reduction} clause before exiting the \code{taskgroup} +region. + +\cexample[5.0]{target_task_reduction}{1} + +\ffreeexample[5.0]{target_task_reduction}{1} + +In the next pair of examples, the task reduction is defined by a +\code{reduction} clause with the \code{task} modifier, rather than a +\code{task\_reduction} clause on a \code{taskgroup} construct. Again, the +partial results from the participating tasks will be combined in some order +into the original reduction variable, \code{sum}. + +\cexample[5.0]{target_task_reduction}{2a} + +\ffreeexample[5.0]{target_task_reduction}{2a} + +Next, the \code{task} modifier is again used to define a task reduction over +participating tasks. This time, the participating tasks are a target task +resulting from a \code{target} construct with the \code{in\_reduction} clause, +and the implicit task (executing on the master thread) that calls +\code{host\_compute}. As before, the partial results from these paricipating +tasks are combined in some order into the original reduction variable. + +\cexample[5.0]{target_task_reduction}{2b} + +\ffreeexample[5.0]{target_task_reduction}{2b} \subsection{Taskloop Reduction} @@ -121,8 +231,8 @@ that if we add the \code{nogroup} clause to the \code{taskloop} construct the co nonconforming, basically because we have a set of tasks that participate in a reduction that has not been defined. -\cexample{taskloop_reduction}{1} -\ffreeexample{taskloop_reduction}{1} +\cexample[5.0]{taskloop_reduction}{1} +\ffreeexample[5.0]{taskloop_reduction}{1} %In the second example, we are computing exactly the same %value but we do it in a very different way. The first thing that we do in the @@ -154,8 +264,9 @@ declared reduction (\code{in\_reduction} clause) whereas in the other case creation of a new reduction is specified and also that all tasks generated by the taskloop will participate on it. -\cexample{taskloop_reduction}{2} -\ffreeexample{taskloop_reduction}{2} +\cexample[5.0]{taskloop_reduction}{2} +\ffreeexample[5.0]{taskloop_reduction}{2} +\clearpage In the OpenMP 5.0 Specification, \code{reduction} clauses for the \code{taskloop}~\code{ simd} construct were also added. @@ -228,10 +339,8 @@ At the end of the parallel region \plc{asum} contains the combined result of all %At the end of the parallel region \plc{asum} contains the combined result of all reductions. -\cexample{taskloop_simd_reduction}{1} +\cexample[5.0]{taskloop_simd_reduction}{1} -\ffreeexample{taskloop_simd_reduction}{1} +\ffreeexample[5.0]{taskloop_simd_reduction}{1} - -% All other reductions diff --git a/Examples_requires.tex b/Examples_requires.tex index 334e481..b53b399 100644 --- a/Examples_requires.tex +++ b/Examples_requires.tex @@ -26,6 +26,6 @@ not updated on the host. %\pagebreak -\cppexample{requires}{1} +\cppexample[5.0]{requires}{1} -\ffreeexample{requires}{1} +\ffreeexample[5.0]{requires}{1} diff --git a/Examples_scan.tex b/Examples_scan.tex new file mode 100644 index 0000000..4ba3232 --- /dev/null +++ b/Examples_scan.tex @@ -0,0 +1,38 @@ +\pagebreak +\section{The \code{scan} Directive} +\label{sec:scan} + +The following examples illustrate how to parallelize a loop that saves +the \emph{prefix sum} of a reduction. This is accomplished by using +the \code{inscan} modifier in the \code{reduction} clause for the input +variable of the scan, and specifying with a \code{scan} directive whether +the storage statement includes or excludes the scan input of the present +iteration (\texttt{k}). + +Basically, the \code{inscan} modifier connects a loop and/or SIMD reduction to +the scan operation, and a \code{scan} construct with an \code{inclusive} or +\code{exclusive} clause specifies whether the ``scan phase'' (lexical block +before and after the directive, respectively) is to use an \plc{inclusive} or +\plc{exclusive} scan value for the list item (\texttt{x}). + +The first example uses the \plc{inclusive} scan operation on a composite +loop-SIMD construct. The \code{scan} directive separates the reduction +statement on variable \texttt{x} from the use of \texttt{x} (saving to array \texttt{b}). +The order of the statements in this example indicates that +value \texttt{a[k]} (\texttt{a(k)} in Fortran) is included in the computation of +the prefix sum \texttt{b[k]} (\texttt{b(k)} in Fortran) for iteration \texttt{k}. + +\cexample[5.0]{scan}{1} + +\ffreeexample[5.0]{scan}{1} + +The second example uses the \plc{exclusive} scan operation on a composite +loop-SIMD construct. The \code{scan} directive separates the use of \texttt{x} +(saving to array \texttt{b}) from the reduction statement on variable \texttt{x}. +The order of the statements in this example indicates that +value \texttt{a[k]} (\texttt{a(k)} in Fortran) is excluded from the computation +of the prefix sum \texttt{b[k]} (\texttt{b(k)} in Fortran) for iteration \texttt{k}. + +\cexample[5.0]{scan}{2} + +\ffreeexample[5.0]{scan}{2} diff --git a/Examples_standalone.tex b/Examples_standalone.tex index 01013ff..4b6a60b 100644 --- a/Examples_standalone.tex +++ b/Examples_standalone.tex @@ -7,7 +7,7 @@ The following example is non-conforming, because the \code{flush}, \code{barrier \code{taskwait}, and \code{taskyield} directives are stand-alone directives and cannot be the immediate substatement of an \code{if} statement. -\cexample{standalone}{1} +\cexample[3.1]{standalone}{1} \pagebreak The following example is non-conforming, because the \code{flush}, \code{barrier}, @@ -15,19 +15,19 @@ The following example is non-conforming, because the \code{flush}, \code{barrier and cannot be the action statement of an \code{if} statement or a labeled branch target. -\ffreeexample{standalone}{1} +\ffreeexample[3.1]{standalone}{1} The following version of the above example is conforming because the \code{flush}, \code{barrier}, \code{taskwait}, and \code{taskyield} directives are enclosed in a compound statement. -\cexample{standalone}{2} +\cexample[3.1]{standalone}{2} \pagebreak The following example is conforming because the \code{flush}, \code{barrier}, \code{taskwait}, and \code{taskyield} directives are enclosed in an \code{if} construct or follow the labeled branch target. -\ffreeexample{standalone}{2} +\ffreeexample[3.1]{standalone}{2} diff --git a/Examples_target.tex b/Examples_target.tex index d04fbeb..0e31ceb 100644 --- a/Examples_target.tex +++ b/Examples_target.tex @@ -9,9 +9,9 @@ This following example shows how the \code{target} construct offloads a code region to a target device. The variables \plc{p}, \plc{v1}, \plc{v2}, and \plc{N} are implicitly mapped to the target device. -\cexample{target}{1} +\cexample[4.0]{target}{1} -\ffreeexample{target}{1} +\ffreeexample[4.0]{target}{1} \subsection{\code{target} Construct with \code{map} Clause} \label{subsec:target_map} @@ -21,9 +21,9 @@ region to a target device. The variables \plc{p}, \plc{v1} and \plc{v2} are expl target device using the \code{map} clause. The variable \plc{N} is implicitly mapped to the target device. -\cexample{target}{2} +\cexample[4.0]{target}{2} -\ffreeexample{target}{2} +\ffreeexample[4.0]{target}{2} \subsection{\code{map} Clause with \code{to}/\code{from} map-types} \label{subsec:target_map_tofrom} @@ -46,14 +46,14 @@ the variable \plc{p} is not initialized with the value of the corresponding vari on the host device, and at the end of the \code{target} region the variable \plc{p} is assigned to the corresponding variable on the host device. -\cexample{target}{3} +\cexample[4.0]{target}{3} The \code{to} and \code{from} map-types allow programmers to optimize data motion. Since data for the \plc{v} arrays are not returned, and data for the \plc{p} array are not transferred to the device, only one-half of the data is moved, compared to the default behavior of an implicit mapping. -\ffreeexample{target}{3} +\ffreeexample[4.0]{target}{3} \subsection{\code{map} Clause with Array Sections} \label{subsec:target_array_section} @@ -64,14 +64,15 @@ the mapping of variables to the target device. Because variables \plc{p}, \plc{v pointers, array section notation must be used to map the arrays. The notation \code{:N} is equivalent to \code{0:N}. -\cexample{target}{4} +\cexample[4.0]{target}{4} +\clearpage In C, the length of the pointed-to array must be specified. In Fortran the extent of the array is known and the length need not be specified. A section of the array can be specified with the usual Fortran syntax, as shown in the following example. The value 1 is assumed for the lower bound for array section \plc{v2(:N)}. -\ffreeexample{target}{4} +\ffreeexample[4.0]{target}{4} A more realistic situation in which an assumed-size array is passed to \code{vec\_mult} requires that the length of the arrays be specified, because the compiler does @@ -79,7 +80,7 @@ not know the size of the storage. A section of the array must be specified with the usual Fortran syntax, as shown in the following example. The value 1 is assumed for the lower bound for array section \plc{v2(:N)}. -\ffreeexample{target}{4b} +\ffreeexample[4.0]{target}{4b} \subsection{\code{target} Construct with \code{if} Clause} \label{subsec:target_if} @@ -95,9 +96,9 @@ The \code{if} clause on the \code{parallel} construct indicates that if the variable \plc{N} is smaller than a second threshold then the \code{parallel} region is inactive. -\cexample{target}{5} +\cexample[4.0]{target}{5} -\ffreeexample{target}{5} +\ffreeexample[4.0]{target}{5} The following example is a modification of the above \plc{target.5} code to show the combined \code{target} and parallel loop directives. It uses the \plc{directive-name} modifier in multiple \code{if} @@ -107,9 +108,9 @@ The \code{if} clause with the \code{target} modifier applies to the \code{target combined directive, and the \code{if} clause with the \code{parallel} modifier applies to the \code{parallel} component of the combined directive. -\cexample{target}{6} +\cexample[4.5]{target}{6} -\ffreeexample{target}{6} +\ffreeexample[4.5]{target}{6} \subsection{target Reverse Offload} \label{subsec:target_reverse_offload} @@ -139,6 +140,6 @@ function. This feature may be necessary if the function exists in another compile unit. -\cexample{target_reverse_offload}{7} +\cexample[5.0]{target_reverse_offload}{7} -\ffreeexample{target_reverse_offload}{7} +\ffreeexample[5.0]{target_reverse_offload}{7} diff --git a/Examples_target_data.tex b/Examples_target_data.tex index 240b394..4af7c39 100644 --- a/Examples_target_data.tex +++ b/Examples_target_data.tex @@ -14,14 +14,14 @@ variables \plc{v1}, \plc{v2}, and \plc{p} from the enclosing device data environ \plc{N} is mapped into the new device data environment from the encountering task's data environment. -\cexample{target_data}{1} +\cexample[4.0]{target_data}{1} \pagebreak The Fortran code passes a reference and specifies the extent of the arrays in the declaration. No length information is necessary in the map clause, as is required with C/C++ pointers. -\ffreeexample{target_data}{1} +\ffreeexample[4.0]{target_data}{1} \subsection{\code{target} \code{data} Region Enclosing Multiple \code{target} Regions} \label{subsec:target_data_multiregion} @@ -39,7 +39,7 @@ In the following example the variables \plc{v1} and \plc{v2} are mapped at each construct. Instead of mapping the variable \plc{p} twice, once at each \code{target} construct, \plc{p} is mapped once by the \code{target} \code{data} construct. -\cexample{target_data}{2} +\cexample[4.0]{target_data}{2} The Fortran code uses reference and specifies the extent of the \plc{p}, \plc{v1} and \plc{v2} arrays. @@ -48,7 +48,7 @@ C/C++ pointers. The arrays \plc{v1} and \plc{v2} are mapped at each \code{target Instead of mapping the array \plc{p} twice, once at each target construct, \plc{p} is mapped once by the \code{target} \code{data} construct. -\ffreeexample{target_data}{2} +\ffreeexample[4.0]{target_data}{2} In the following example, the array \plc{Q} is mapped once at the enclosing \code{target}~\code{data} region instead of at each \code{target} construct. @@ -58,9 +58,9 @@ the \code{tofrom} map-type at the first \code{target} construct in order to retu its reduced value from the parallel loop construct to the host. The variable defaults to firstprivate at the second \code{target} construct. -\cexample{target_data}{3} +\cexample[4.0]{target_data}{3} -\ffreeexample{target_data}{3} +\ffreeexample[4.0]{target_data}{3} \subsection{\code{target} \code{data} Construct with Orphaned Call} @@ -87,7 +87,7 @@ of the storage location associated with their corresponding array sections. Note that the following pairs of array section storage locations are equivalent (\plc{p0[:N]}, \plc{p1[:N]}), (\plc{v1[:N]},\plc{v3[:N]}), and (\plc{v2[:N]},\plc{v4[:N]}). -\cexample{target_data}{4} +\cexample[4.0]{target_data}{4} The Fortran code maps the pointers and storage in an identical manner (same extent, but uses indices from 1 to \plc{N}). @@ -103,7 +103,7 @@ assigned the address of the storage location associated with their corresponding array sections. Note that the following pair of array storage locations are equivalent (\plc{p0},\plc{p1}), (\plc{v1},\plc{v3}), and (\plc{v2},\plc{v4}). -\ffreeexample{target_data}{4} +\ffreeexample[4.0]{target_data}{4} In the following example, the variables \plc{p1}, \plc{v3}, and \plc{v4} are references to the pointer @@ -112,7 +112,7 @@ environment inherits the pointer variables \plc{p0}, \plc{v1}, and \plc{v2} from \code{data} construct's device data environment. Thus, \plc{p1}, \plc{v3}, and \plc{v4} are already present in the device data environment. -\cppexample{target_data}{5} +\cppexample[4.0]{target_data}{5} In the following example, the usual Fortran approach is used for dynamic memory. The \plc{p0}, \plc{v1}, and \plc{v2} arrays are allocated in the main program and passed as references @@ -122,7 +122,7 @@ environment inherits the arrays \plc{p0}, \plc{v1}, and \plc{v2} from the enclos device data environment. Thus, \plc{p1}, \plc{v3}, and \plc{v4} are already present in the device data environment. -\ffreeexample{target_data}{5} +\ffreeexample[4.0]{target_data}{5} \subsection{\code{target} \code{data} Construct with \code{if} Clause} \label{subsec:target_data_if} @@ -140,7 +140,7 @@ variable \plc{p} is implicitly mapped with a map-type of \code{tofrom}, but the location for the array section \plc{p[0:N]} will not be mapped in the device data environments of the \code{target} constructs. -\cexample{target_data}{6} +\cexample[4.0]{target_data}{6} \pagebreak The \code{if} clauses work the same way for the following Fortran code. The \code{target} @@ -149,7 +149,7 @@ an \code{if} clause with the same condition, so that the \code{target} \code{dat region and the \code{target} region are either both created for the device, or are both ignored. -\ffreeexample{target_data}{6} +\ffreeexample[4.0]{target_data}{6} \pagebreak In the following example, when the \code{if} clause conditional expression on @@ -161,7 +161,7 @@ region the array section \plc{p[0:N]} will be assigned from the device data envi to the corresponding variable in the data environment of the task that encountered the \code{target} \code{data} construct, resulting in undefined values in \plc{p[0:N]}. -\cexample{target_data}{7} +\cexample[4.0]{target_data}{7} \pagebreak The \code{if} clauses work the same way for the following Fortran code. When @@ -174,5 +174,5 @@ region the \plc{p} array will be assigned from the device data environment to th variable in the data environment of the task that encountered the \code{target} \code{data} construct, resulting in undefined values in \plc{p}. -\ffreeexample{target_data}{7} +\ffreeexample[4.0]{target_data}{7} diff --git a/Examples_target_defaultmap.tex b/Examples_target_defaultmap.tex new file mode 100644 index 0000000..2e48fbc --- /dev/null +++ b/Examples_target_defaultmap.tex @@ -0,0 +1,56 @@ +\pagebreak +\section{\code{defaultmap} Clause} +\label{sec:defaultmap} + +The implicitly-determined, data-mapping and data-sharing attribute +rules of variables referenced in a \code{target} construct can be +changed by the \code{defaultmap} clause introduced in OpenMP 5.0. +The implicit behavior is specified as +\code{alloc}, \code{to}, \code{from}, \code{tofrom}, +\code{firstprivate}, \code{none}, \code{default} or \code{present}, +and is applied to a variable-category, where +\code{scalar}, \code{aggregate}, \code{allocatable}, +and \code{pointer} are the variable categories. + +In OpenMP, a ``category'' has a common data-mapping and data-sharing +behavior for variable types within the category. +In C/C++, \code{scalar} refers to base-language scalar variables, except pointers. +In Fortran it refers to a scalar variable, as defined by the base language, +with intrinsic type, and excludes character type. + +Also, \code{aggregate} refers to arrays and structures (C/C++) and +derived types (Fortran). Fortran has the additional category of \code{allocatable}. + +%In the example below, the first \code{target} construct uses \code{defaultmap} +%clauses to explicitly set data-mapping attributes that reproduce +%the default implicit mapping (data-mapping and data-sharing attributes). That is, +%if the \code{defaultmap} clauses were removed, the results would be identical. +In the example below, the first \code{target} construct uses \code{defaultmap} +clauses to set data-mapping and possibly data-sharing attributes that reproduce +the default implicit mapping (data-mapping and data-sharing attributes). That is, +if the \code{defaultmap} clauses were removed, the results would be identical. + +In the second \code{target} construct all implicit behavior is removed +by specifying the \code{none} implicit behavior in the \code{defaultmap} clause. +Hence, all variables must be explicitly mapped. +In the C/C++ code a scalar (\texttt{s}), an array (\texttt{A}) and a structure +(\texttt{S}) are explicitly mapped \code{tofrom}. +The Fortran code uses a derived type (\texttt{D}) in lieu of structure. + +The third \code{target} construct shows another usual case for using the \code{defaultmap} clause. +The default mapping for (non-pointer) scalar variables is specified as \code{tofrom}. +Here, the default implicit mapping for \texttt{s3} is \code{tofrom} as specified +in the \code{defaultmap} clause, and \texttt{s1} and \texttt{s2} are explicitly +mapped with the \code{firstprivate} data-sharing attribute. + +In the fourth \code{target} construct all arrays, structures (C/C++) and derived +types (Fortran) are mapped with \code{firstprivate} data-sharing behavior by a +\code{defaultmap} clause with an \code{aggregate} variable category. +For the \texttt{H} allocated array in the Fortran code, the \code{allocable} +category must be used in a separate \code{defaultmap} clause to acquire +\code{firsprivate} data-sharing behavior (\texttt{H} has the Fortran allocatable attribute). +% (Common use cases for C/C++ heap storage can be found in \specref{sec:pointer_mapping}.) + +\cexample[5.0]{target_defaultmap}{1} + +\ffreeexample[5.0]{target_defaultmap}{1} diff --git a/Examples_target_mapper.tex b/Examples_target_mapper.tex index 2e42d09..272c259 100644 --- a/Examples_target_mapper.tex +++ b/Examples_target_mapper.tex @@ -26,11 +26,11 @@ full structure, plus the dynamic storage of the \plc{data} element. %The associated Fortran allocatable \plc{data} array is automatically mapped with the derived %type, it does not require an array section as in the C/C++ example. -\cexample{target_mapper}{1} +\cexample[5.0]{target_mapper}{1} -\ffreeexample{target_mapper}{1} +\ffreeexample[5.0]{target_mapper}{1} -\pagebreak +%\pagebreak The next example illustrates the use of the \plc{mapper-identifier} and deep copy within a structure. The structure, \plc{dzmat\_t}, represents a complex matrix, with separate real (\plc{r\_m}) and imaginary (\plc{i\_m}) elements. @@ -56,11 +56,11 @@ Note, the \plc{is} and \plc{ie} scalars are firstprivate by default for a target region, but are declared firstprivate anyway to remind the user of important firstprivate data-sharing properties required here. -\cexample{target_mapper}{2} +\cexample[5.0]{target_mapper}{2} -\ffreeexample{target_mapper}{2} +\ffreeexample[5.0]{target_mapper}{2} -\pagebreak +%\pagebreak In the third example \plc{myvec} structures are nested within a \plc{mypoints} structure. The \plc{myvec\_t} type is mapped as in the first example. Following the \plc{mypoints} structure declaration, @@ -80,7 +80,7 @@ type structure. %Note, in the main program \plc{P} is an array of \plc{mypoints\_t} type structures, %and hence every element of the array is mapped with the mapper prescription. -\cexample{target_mapper}{3} +\cexample[5.0]{target_mapper}{3} -\ffreeexample{target_mapper}{3} +\ffreeexample[5.0]{target_mapper}{3} diff --git a/Examples_target_offload.tex b/Examples_target_offload.tex index ddd3926..995f300 100644 --- a/Examples_target_offload.tex +++ b/Examples_target_offload.tex @@ -34,10 +34,10 @@ when the \code{OMP\_DISPLAY\_ENV} environment variable is set to \code{TRUE} or \code{VERBOSE}. %\pagebreak -\cexample{target_offload_control}{1} +\cexample[5.0]{target_offload_control}{1} %\pagebreak -\ffreeexample{target_offload_control}{1} +\ffreeexample[5.0]{target_offload_control}{1} % OMP 4.5 target offload 15:9-11 diff --git a/Examples_target_pointer_mapping.tex b/Examples_target_pointer_mapping.tex index 79798e7..de44201 100644 --- a/Examples_target_pointer_mapping.tex +++ b/Examples_target_pointer_mapping.tex @@ -2,6 +2,23 @@ \section{Pointer mapping} \label{sec:pointer_mapping} +Pointers that contain host addresses require that those addresses are translated to device addresses for them to be useful in the context of a device data environment. Broadly speaking, there are two scenarios where this is important. + +The first scenario is where the pointer is mapped to the device data environment, such that references to the pointer inside a \code{target} region are to the corresponding pointer. Pointer attachment ensures that the corresponding pointer will contain a device address when all of the following conditions are true: +\begin{itemize} + \item the pointer is mapped by directive $A$ to a device; + \item a list item that uses the pointer as its base pointer (call it the \emph{pointee}) is mapped, to the same device, by directive $B$, which may be the same as $A$; + \item the effect of directive $B$ is to create either the corresponding pointer or pointee in the device data environment of the device. +\end{itemize} + +Given the above conditions, pointer attachment is initiated as a result of directive $B$ and subsequent references to the pointee list item in a target region that use the pointer will access the corresponding pointee. The corresponding pointer remains in this \emph{attached} state until it is removed from the device data environment. + +The second scenario, which is only applicable for C/C++, is where the pointer is implicitly privatized inside a \code{target} construct when it appears as the base pointer to a list item on the construct and does not appear explicitly as a list item in a \code{map} clause, \code{is\_device\_ptr} clause, or data-sharing attribute clause. This scenario can be further split into two cases: the list item is a zero-length array section (e.g., \plc{p[:0]}) or it is not. + +If it is a zero-length array section, this will trigger a runtime check on entry to the \code{target} region for a previously mapped list item where the value of the pointer falls within the range of its base address and ending address. If such a match is found the private pointer is initialized to the device address corresponding to the value of the original pointer, and otherwise it is initialized to NULL (or retains its original value if the \code{unified\_address} requirement is specified for that compilation unit). + +If the list item (again, call it the \emph{pointee}) is not a zero-length array section, the private pointer will be initialized such that references in the \code{target} region to the pointee list item that use the pointer will access the corresponding pointee. + The following example shows the basics of mapping pointers with and without associated storage on the host. @@ -24,18 +41,23 @@ data at the end of the \code{target} region. As a comparison, note that the \plc{aray} array is automatically mapped, since the compiler knows the extent of the array. -The pointer \plc{ptr3} is used in the \code{target} region and has -a data-sharing attribute of firstprivate. -The pointer is implicitly mapped to a zero-length array section. -Neither the pointer address nor any -of its locally assigned data on the device is returned -to the host. +The pointer \plc{ptr3} is used inside the \code{target} construct, but it does +not appear in a data-mapping or data-sharing clause. Nor is there a +\code{defaultmap} clause on the construct to indicate what its implicit +data-mapping or data-sharing attribute should be. For such a case, \plc{ptr3} +will be implicitly privatized within the construct and there will be a runtime +check to see if the host memory to which it is pointing has corresponding memory +in the device data environment. If this runtime check passes, the private +\plc{ptr3} would be initialized to point to the corresponding memory. But in +this case the check does not pass and so it is initialized to null. +Since \plc{ptr3} is private, the value to which it is assigned in the +\code{target} region is not returned into the original \plc{ptr3} on the host. -\cexample{target_ptr_map}{1} +\cexample[5.0]{target_ptr_map}{1} In the following example the global pointer \plc{p} appears in a \code{declare}~\code{target} directive. Hence, the pointer \plc{p} will -persist on the device throughout executions in all target regions. +persist on the device throughout executions in all \code{target} regions. The pointer is also used in an array section of a \code{map} clause on a \code{target} construct. When storage associated with @@ -50,4 +72,49 @@ pointer on the device is \emph{attached}.) % For globals with declare target is there such a things a % original and corresponding? -\cexample{target_ptr_map}{2} +\cexample[5.0]{target_ptr_map}{2} + +The following two examples illustrate subtle differences in pointer attachment +to device address because of the order of data mapping. + +In example \plc{target\_ptr\_map.3a} +the global pointer \plc{p1} points to array \plc{x} and \plc{p2} points to +array \plc{y} on the host. +The array section \plc{x[:N]} is mapped by the \code{target}~\code{enter}~\code{data} directive while array \plc{y} is mapped +on the \code{target} construct. +Since the \code{declare}~\code{target} directive is applied to the declaration +of \plc{p1}, \plc{p1} is a treated like a mapped variable on the \code{target} +construct and references to \plc{p1} inside the construct will be to the +corresponding \plc{p1} that exists on the device. However, the corresponding +\plc{p1} will be undefined since there is no pointer attachment for it. Pointer +attachment for \plc{p1} would require that (1) \plc{p1} (or an lvalue +expression that refers to the same storage as \plc{p1}) appears as a base +pointer to a list item in a \code{map} clause, and (2) the construct that has +the \code{map} clause causes the list item to transition from \emph{not mapped} +to \emph{mapped}. The conditions are clearly not satisifed for this example. + +The problem for \plc{p2} in this example is also subtle. It will be privatized +inside the \code{target} construct, with a runtime check for whether the memory +to which it is pointing has corresponding memory that is accessible on the +device. If this check is successful then the \plc{p2} inside the construct +would be appropriately initialized to point to that corresponding memory. +Unfortunately, despite there being an implicit map of the array \plc{y} (to +which \plc{p2} is pointing) on the construct, the order of this map relative to +the initialization of \plc{p2} is unspecified. Therefore, the initial value of +\plc{p2} will also be undefined. + +Thus, referencing values via either \plc{p1} or \plc{p2} inside +the \code{target} region would be invalid. + +\cexample[5.0]{target_ptr_map}{3a} + +In example \plc{target\_ptr\_map.3b} the mapping orders for arrays \plc{x} +and \plc{y} were rearranged to allow proper pointer attachments. +On the \code{target} construct, the \code{map(x)} clause triggers pointer +attachment for \plc{p1} to the device address of \plc{x}. +Pointer \plc{p2} is assigned the device address of the previously mapped + array \plc{y}. +Referencing values via either \plc{p1} or \plc{p2} inside the \code{target} region is now valid. + +\cexample[5.0]{target_ptr_map}{3b} + diff --git a/Examples_target_structure_mapping.tex b/Examples_target_structure_mapping.tex index 8166caf..9cb52f1 100644 --- a/Examples_target_structure_mapping.tex +++ b/Examples_target_structure_mapping.tex @@ -19,7 +19,7 @@ Note: The buffer arrays and the \plc{x} variable have been grouped together, so the components that will reside on the device are all together (without gaps). This allows the runtime to optimize the transfer and the storage footprint on the device. -\cexample{target_struct_map}{1} +\cexample[5.0]{target_struct_map}{1} %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% @@ -28,7 +28,7 @@ a C++ class. In the member function \plc{SAXPY::driver} the array section \plc{p[:N]} is \emph{attached} to the pointer member \plc{p} on the device. -\cppexample{target_struct_map}{2} +\cppexample[5.0]{target_struct_map}{2} %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% diff --git a/Examples_target_unstructured_data.tex b/Examples_target_unstructured_data.tex index 21c1641..898bf29 100644 --- a/Examples_target_unstructured_data.tex +++ b/Examples_target_unstructured_data.tex @@ -22,7 +22,7 @@ back to the host. Note, the stand-alone \code{target}~\code{enter}~\code{data} o after the host vector is created, and the \code{target}~\code{exit}~\code{data} construct occurs before the host data is deleted. -\cppexample{target_unstructured_data}{1} +\cppexample[4.5]{target_unstructured_data}{1} \pagebreak The following C code allocates and frees the data member of a Matrix structure. @@ -33,7 +33,7 @@ and then frees the memory on the host. Note, the stand-alone \code{target}~\code{enter}~\code{data} occurs after the host memory is allocated, and the \code{target}~\code{exit}~\code{data} construct occurs before the host data is freed. -\cexample{target_unstructured_data}{1} +\cexample[4.5]{target_unstructured_data}{1} \pagebreak The following Fortran code allocates and deallocates a module array. The @@ -44,6 +44,6 @@ then deallocates the array on the host. Note, the stand-alone \code{target}~\code{enter}~\code{data} occurs after the host memory is allocated, and the \code{target}~\code{exit}~\code{data} construct occurs before the host data is deallocated. -\ffreeexample{target_unstructured_data}{1} +\ffreeexample[4.5]{target_unstructured_data}{1} %end diff --git a/Examples_target_update.tex b/Examples_target_update.tex index e2f4ced..00bcb9c 100644 --- a/Examples_target_update.tex +++ b/Examples_target_update.tex @@ -27,9 +27,9 @@ region and waits for the completion of the region. The second \code{target} region uses the updated values of \plc{v1[:N]} and \plc{v2[:N]}. -\cexample{target_update}{1} +\cexample[4.0]{target_update}{1} -\ffreeexample{target_update}{1} +\ffreeexample[4.0]{target_update}{1} \subsection{\code{target} \code{update} Construct with \code{if} Clause} \label{subsec:target_update_if} @@ -49,7 +49,7 @@ assigns the new values of \plc{v1} and \plc{v2} from the task's data environment mapped array sections in the \code{target} \code{data} construct's device data environment. -\cexample{target_update}{2} +\cexample[4.0]{target_update}{2} -\ffreeexample{target_update}{2} +\ffreeexample[4.0]{target_update}{2} diff --git a/Examples_task_affinity.tex b/Examples_task_affinity.tex index 0542cbe..ddc2695 100644 --- a/Examples_task_affinity.tex +++ b/Examples_task_affinity.tex @@ -26,7 +26,7 @@ The use of the \plc{A} array is sufficient for this case, because one would expect the storage for \plc{A} and \plc{B} would be physically "close" (as provided by the hint in the first task). -\cexample{affinity}{6} +\cexample[5.0]{affinity}{6} -\ffreeexample{affinity}{6} +\ffreeexample[5.0]{affinity}{6} diff --git a/Examples_task_dep.tex b/Examples_task_dep.tex index c26616b..4339428 100644 --- a/Examples_task_dep.tex +++ b/Examples_task_dep.tex @@ -8,9 +8,9 @@ This example shows a simple flow dependence using a \code{depend} clause on the \code{task} construct. -\cexample{task_dep}{1} +\cexample[4.0]{task_dep}{1} -\ffreeexample{task_dep}{1} +\ffreeexample[4.0]{task_dep}{1} The program will always print \texttt{"}x = 2\texttt{"}, because the \code{depend} clauses enforce the ordering of the tasks. If the \code{depend} clauses had been @@ -23,9 +23,9 @@ would have a race condition. This example shows an anti-dependence using the \code{depend} clause on the \code{task} construct. -\cexample{task_dep}{2} +\cexample[4.0]{task_dep}{2} -\ffreeexample{task_dep}{2} +\ffreeexample[4.0]{task_dep}{2} The program will always print \texttt{"}x = 1\texttt{"}, because the \code{depend} clauses enforce the ordering of the tasks. If the \code{depend} clauses had been @@ -38,9 +38,9 @@ race condition. This example shows an output dependence using the \code{depend} clause on the \code{task} construct. -\cexample{task_dep}{3} +\cexample[4.0]{task_dep}{3} -\ffreeexample{task_dep}{3} +\ffreeexample[4.0]{task_dep}{3} The program will always print \texttt{"}x = 2\texttt{"}, because the \code{depend} clauses enforce the ordering of the tasks. If the \code{depend} clauses had been @@ -55,9 +55,9 @@ In this example we show potentially concurrent execution of tasks using multiple flow dependences expressed using the \code{depend} clause on the \code{task} construct. -\cexample{task_dep}{4} +\cexample[4.0]{task_dep}{4} -\ffreeexample{task_dep}{4} +\ffreeexample[4.0]{task_dep}{4} The last two tasks are dependent on the first task. However there is no dependence between the last two tasks, which may execute in any order (or concurrently if @@ -72,9 +72,9 @@ in any order and the program would have a race condition. This example shows a task-based blocked matrix multiplication. Matrices are of NxN elements, and the multiplication is implemented using blocks of BSxBS elements. -\cexample{task_dep}{5} +\cexample[4.0]{task_dep}{5} -\ffreeexample{task_dep}{5} +\ffreeexample[4.0]{task_dep}{5} \subsection{\code{taskwait} with Dependences} \label{subsec:taskwait_depend} @@ -105,9 +105,9 @@ Hence, immediately after the first \code{taskwait} it is unsafe to access the The second \code{taskwait} ensures that the second child task has completed; hence it is safe to access the \plc{y} variable in the following print statement. -\cexample{task_dep}{6} +\cexample[5.0]{task_dep}{6} -\ffreeexample{task_dep}{6} +\ffreeexample[5.0]{task_dep}{6} In this example the first two tasks are serialized, because a dependence on the first child is produced by \plc{x} with the \code{in} dependence type @@ -123,9 +123,9 @@ included to illustrate how the child task dependences can be completely annotate in a data-flow model.) -\cexample{task_dep}{7} +\cexample[5.0]{task_dep}{7} -\ffreeexample{task_dep}{7} +\ffreeexample[5.0]{task_dep}{7} This example is similar to the previous one, except the generating task is @@ -149,9 +149,9 @@ the dependence type of variables in the \code{taskwait} \code{depend} clause when selecting child tasks that the generating task must wait on, so that its execution after the taskwait does not produce race conditions on variables accessed by non-completed child tasks. -\cexample{task_dep}{8} +\cexample[5.0]{task_dep}{8} -\ffreeexample{task_dep}{8} +\ffreeexample[5.0]{task_dep}{8} \pagebreak \subsection{Mutually Exclusive Execution with Dependences} @@ -168,18 +168,18 @@ to the \code{mutexinoutset} dependence type on \code{c}, T4 and T5 may be scheduled in any order with respect to each other, but not at the same time. Tasks T6 will be scheduled after both T4 and T5 are completed. -\cexample{task_dep}{9} +\cexample[5.0]{task_dep}{9} -\ffreeexample{task_dep}{9} +\ffreeexample[5.0]{task_dep}{9} The following example demonstrates a situation where the \code{mutexinoutset} dependence type is advantageous. If \code{shortTaskB} completes before \code{longTaskA}, the runtime can take advantage of this by scheduling \code{longTaskBC} before \code{shortTaskAC}. -\cexample{task_dep}{10} +\cexample[5.0]{task_dep}{10} -\ffreeexample{task_dep}{10} +\ffreeexample[5.0]{task_dep}{10} \subsection{Multidependences Using Iterators} \label{subsec:depend_iterator} @@ -211,6 +211,31 @@ identical nor disjoint to the storage prescibed by the elements of the loop tasks. The iterator overcomes this restriction by effectively creating n disjoint storage areas. -\cexample{task_dep}{11} +\cexample[5.0]{task_dep}{11} + +\ffreeexample[5.0]{task_dep}{11} + +\subsection{Dependence for Undeferred Tasks} +\label{subsec:depend_undefer_task} + +In the following example, we show that even if a task is undeferred as specified +by an \code{if} clause that evaluates to \plc{false}, task dependences are +still honored. + +The \code{depend} clauses of the first and second explicit tasks specify that +the first task is completed before the second task. + +The second explicit task has an \code{if} clause that evaluates to \plc{false}. +This means that the execution of the generating task (the implicit task of +the \code{single} region) must be suspended until the second explict task +is completed. +But, because of the dependence, the first explicit task must complete first, +then the second explicit task can execute and complete, and only then +the generating task can resume to the print statement. +Thus, the program will always print "\texttt{x = 2}". + +\cexample[4.0]{task_dep}{12} +\clearpage + +\ffreeexample[4.0]{task_dep}{12} -\ffreeexample{task_dep}{11} diff --git a/Examples_task_priority.tex b/Examples_task_priority.tex index 734efc2..75dd262 100644 --- a/Examples_task_priority.tex +++ b/Examples_task_priority.tex @@ -16,7 +16,7 @@ The creation of tasks occurs in ascending order (according to the iteration spac the loop) but a hint, by means of the \code{priority} clause, is provided to reverse the execution order. -\cexample{task_priority}{1} +\cexample[4.5]{task_priority}{1} -\ffreeexample{task_priority}{1} +\ffreeexample[4.5]{task_priority}{1} diff --git a/Examples_taskgroup.tex b/Examples_taskgroup.tex index 3e06831..5b0579a 100644 --- a/Examples_taskgroup.tex +++ b/Examples_taskgroup.tex @@ -14,7 +14,7 @@ does not participate in the synchronization, and is left free to execute in para This is opposed to the behavior of the \code{taskwait} construct, which would include the background tasks in the synchronization. -\cexample{taskgroup}{1} +\cexample[4.0]{taskgroup}{1} -\ffreeexample{taskgroup}{1} +\ffreeexample[4.0]{taskgroup}{1} diff --git a/Examples_tasking.tex b/Examples_tasking.tex index e926c42..ec44c0d 100644 --- a/Examples_tasking.tex +++ b/Examples_tasking.tex @@ -9,17 +9,17 @@ note that the tasks will be executed in no specified order because there are no synchronization directives. Thus, assuming that the traversal will be done in post order, as in the sequential code, is wrong. -\cexample{tasking}{1} +\cexample[3.0]{tasking}{1} -\ffreeexample{tasking}{1} +\ffreeexample[3.0]{tasking}{1} In the next example, we force a postorder traversal of the tree by adding a \code{taskwait} directive. Now, we can safely assume that the left and right sons have been executed before we process the current node. -\cexample{tasking}{2} +\cexample[3.0]{tasking}{2} -\ffreeexample{tasking}{2} +\ffreeexample[3.0]{tasking}{2} The following example demonstrates how to use the \code{task} construct to process elements of a linked list in parallel. The thread executing the \code{single} @@ -28,18 +28,19 @@ in the current team. The pointer \plc{p} is \code{firstprivate} by default on the \code{task} construct so it is not necessary to specify it in a \code{firstprivate} clause. -\cexample{tasking}{3} +\cexample[3.0]{tasking}{3} -\ffreeexample{tasking}{3} +\ffreeexample[3.0]{tasking}{3} The \code{fib()} function should be called from within a \code{parallel} region for the different specified tasks to be executed in parallel. Also, only one thread of the \code{parallel} region should call \code{fib()} unless multiple concurrent Fibonacci computations are desired. -\cexample{tasking}{4} +\cexample[3.0]{tasking}{4} -\fexample{tasking}{4} +\fexample[3.0]{tasking}{4} +\clearpage Note: There are more efficient algorithms for computing Fibonacci numbers. This classic recursion algorithm is for illustrative purposes. @@ -52,9 +53,9 @@ loop to suspend its task at the task scheduling point in the \code{task} directi and start executing unassigned tasks. Once the number of unassigned tasks is sufficiently low, the thread may resume execution of the task generating loop. -\cexample{tasking}{5} +\cexample[3.0]{tasking}{5} -\fexample{tasking}{5} +\fexample[3.0]{tasking}{5} The following example is the same as the previous one, except that the tasks are generated in an untied task. While generating the tasks, the implementation may @@ -69,9 +70,9 @@ to resume the task generating loop. In the previous examples, the other threads would be forced to idle until the generating thread finishes its long task, since the task generating loop was in a tied task. -\cexample{tasking}{6} +\cexample[3.0]{tasking}{6} -\fexample{tasking}{6} +\fexample[3.0]{tasking}{6} The following two examples demonstrate how the scheduling rules illustrated in Section 2.11.3 of the OpenMP 4.0 specification affect the usage of @@ -86,20 +87,20 @@ both of the task regions that modify \code{tp}. The parts of these task regions in which \code{tp} is modified may be executed in any order so the resulting value of \code{var} can be either 1 or 2. -\cexample{tasking}{7} +\cexample[3.0]{tasking}{7} -\fexample{tasking}{7} +\fexample[3.0]{tasking}{7} In this example, scheduling constraints prohibit a thread in the team from executing a new task that modifies \code{tp} while another such task region tied to the same thread is suspended. Therefore, the value written will persist across the task scheduling point. -\cexample{tasking}{8} +\cexample[3.0]{tasking}{8} -\fexample{tasking}{8} +\fexample[3.0]{tasking}{8} The following two examples demonstrate how the scheduling rules illustrated in Section 2.11.3 of the OpenMP 4.0 specification affect the usage of locks @@ -112,20 +113,20 @@ it encounters the task scheduling point at task 3, it could suspend task 1 and begin task 2 which will result in a deadlock when it tries to enter critical region 1. -\cexample{tasking}{9} +\cexample[3.0]{tasking}{9} -\fexample{tasking}{9} +\fexample[3.0]{tasking}{9} In the following example, \code{lock} is held across a task scheduling point. However, according to the scheduling restrictions, the executing thread can't begin executing one of the non-descendant tasks that also acquires \code{lock} before the task region is complete. Therefore, no deadlock is possible. -\cexample{tasking}{10} +\cexample[3.0]{tasking}{10} - -\ffreeexample{tasking}{10} +\ffreeexample[3.0]{tasking}{10} +\clearpage The following examples illustrate the use of the \code{mergeable} clause in the \code{task} construct. In this first example, the \code{task} construct has @@ -139,9 +140,9 @@ outcome does not depend on whether or not the task is merged (that is, the task will always increment the same variable and will always compute the same value for \code{x}). -\cexample{tasking}{11} +\cexample[3.1]{tasking}{11} -\ffreeexample{tasking}{11} +\ffreeexample[3.1]{tasking}{11} This second example shows an incorrect use of the \code{mergeable} clause. In this example, the created task will access different instances of the variable @@ -150,9 +151,9 @@ it will access the same variable \code{x} if the task is merged. As a result, the behavior of the program is unspecified and it can print two different values for \code{x} depending on the decisions taken by the implementation. -\cexample{tasking}{12} +\cexample[3.1]{tasking}{12} -\ffreeexample{tasking}{12} +\ffreeexample[3.1]{tasking}{12} The following example shows the use of the \code{final} clause and the \code{omp\_in\_final} API call in a recursive binary search program. To reduce overhead, once a certain @@ -170,9 +171,9 @@ in the stack could also be avoided but it would make this example less clear. Th clause since all tasks created in a \code{final} task region are included tasks that can be merged if the \code{mergeable} clause is present. -\cexample{tasking}{13} +\cexample[3.1]{tasking}{13} -\ffreeexample{tasking}{13} +\ffreeexample[3.1]{tasking}{13} The following example illustrates the difference between the \code{if} and the \code{final} clauses. The \code{if} clause has a local effect. In the first @@ -184,7 +185,7 @@ task itself. In the second nest of tasks, the nested tasks will be created as in tasks. Note also that the conditions for the \code{if} and \code{final} clauses are usually the opposite. -\cexample{tasking}{14} +\cexample[3.1]{tasking}{14} -\ffreeexample{tasking}{14} +\ffreeexample[3.1]{tasking}{14} diff --git a/Examples_taskloop.tex b/Examples_taskloop.tex index 9a0ed7c..37bb06c 100644 --- a/Examples_taskloop.tex +++ b/Examples_taskloop.tex @@ -9,9 +9,9 @@ The \code{grainsize} clause specifies that each task is to execute at least 500 The \code{nogroup} clause removes the implicit taskgroup of the \code{taskloop} construct; the explicit \code{taskgroup} construct in the example ensures that the function is not exited before the long-running task and the loops have finished execution. -\cexample{taskloop}{1} +\cexample[4.5]{taskloop}{1} -\ffreeexample{taskloop}{1} +\ffreeexample[4.5]{taskloop}{1} %\clearpage @@ -34,6 +34,6 @@ tasks. This is the common use case for the \code{taskloop} construct.) In the example, the code thus prints \code{x1 = 16384} (\plc{T}*\plc{N}) and \code{x2 = 1024} (\plc{N}). -\cexample{taskloop}{2} +\cexample[4.5]{taskloop}{2} -\ffreeexample{taskloop}{2} +\ffreeexample[4.5]{taskloop}{2} diff --git a/Examples_taskyield.tex b/Examples_taskyield.tex index 4a8eefa..8e2ecc0 100644 --- a/Examples_taskyield.tex +++ b/Examples_taskyield.tex @@ -8,7 +8,7 @@ that must be done in a critical region. By using \code{taskyield} when a task cannot get access to the \code{critical} region the implementation can suspend the current task and schedule some other task that can do something useful. -\cexample{taskyield}{1} +\cexample[3.1]{taskyield}{1} -\ffreeexample{taskyield}{1} +\ffreeexample[3.1]{taskyield}{1} diff --git a/Examples_teams.tex b/Examples_teams.tex index 2a48344..3aef99b 100644 --- a/Examples_teams.tex +++ b/Examples_teams.tex @@ -16,9 +16,9 @@ region. The \code{omp\_get\_team\_num} routine returns the team number, which is between 0 and one less than the value returned by \code{omp\_get\_num\_teams}. The following example manually distributes a loop across two teams. -\cexample{teams}{1} +\cexample[4.0]{teams}{1} -\ffreeexample{teams}{1} +\ffreeexample[4.0]{teams}{1} \subsection{\code{target}, \code{teams}, and \code{distribute} Constructs} \label{subsec:teams_distribute} @@ -47,9 +47,9 @@ created by the \code{teams} construct. At the end of the \code{teams} region, each master thread's private copy of \plc{sum} is reduced into the final \plc{sum} that is implicitly mapped into the \code{target} region. -\cexample{teams}{2} +\cexample[4.0]{teams}{2} -\ffreeexample{teams}{2} +\ffreeexample[4.0]{teams}{2} \subsection{\code{target} \code{teams}, and Distribute Parallel Loop Constructs} \label{subsec:teams_distribute_parallel} @@ -62,9 +62,9 @@ team executes the \code{teams} region. The distribute parallel loop construct schedules the loop iterations across the master threads of each team and then across the threads of each team. -\cexample{teams}{3} +\cexample[4.5]{teams}{3} -\ffreeexample{teams}{3} +\ffreeexample[4.5]{teams}{3} \subsection{\code{target} \code{teams} and Distribute Parallel Loop Constructs with Scheduling Clauses} @@ -87,9 +87,9 @@ The \code{schedule} clause indicates that the 1024 iterations distributed to a master thread are then assigned to the threads in its associated team in chunks of 64 iterations. -\cexample{teams}{4} +\cexample[4.0]{teams}{4} -\ffreeexample{teams}{4} +\ffreeexample[4.0]{teams}{4} \subsection{\code{target} \code{teams} and \code{distribute} \code{simd} Constructs} \label{subsec:teams_distribute_simd} @@ -102,9 +102,9 @@ master thread of each team executes the \code{teams} region. The \code{distribute} \code{simd} construct schedules the loop iterations across the master thread of each team and then uses SIMD parallelism to execute the iterations. -\cexample{teams}{5} +\cexample[4.0]{teams}{5} -\ffreeexample{teams}{5} +\ffreeexample[4.0]{teams}{5} \subsection{\code{target} \code{teams} and Distribute Parallel Loop SIMD Constructs} \label{subsec:teams_distribute_parallel_simd} @@ -118,7 +118,7 @@ The distribute parallel loop SIMD construct schedules the loop iterations across the master thread of each team and then across the threads of each team where each thread uses SIMD parallelism. -\cexample{teams}{6} +\cexample[4.0]{teams}{6} -\ffreeexample{teams}{6} +\ffreeexample[4.0]{teams}{6} diff --git a/Examples_udr.tex b/Examples_udr.tex index a0c57ae..5d577ce 100644 --- a/Examples_udr.tex +++ b/Examples_udr.tex @@ -26,35 +26,36 @@ The initializer of the \code{declare}~\code{reduction} directive specifies the initial value for the private variable of each implicit task. The \code{omp\_priv} identifier is used to denote the private variable. -\cexample{udr}{1} +\cexample[4.0]{udr}{1} +\clearpage The following example shows the corresponding code in Fortran. The \code{declare}~\code{reduction} directives are specified as part of the declaration in subroutine \plc{find\_enclosing\_rectangle} and the procedures that perform the min and max operations are specified as subprograms. -\ffreeexample{udr}{1} +\ffreeexample[4.0]{udr}{1} The following example shows the same computation as \plc{udr.1} but it illustrates that you can craft complex expressions in the user-defined reduction declaration. In this case, instead of calling the \plc{minproc} and \plc{maxproc} functions we inline the code in a single expression. -\cexample{udr}{2} +\cexample[4.0]{udr}{2} The corresponding code of the same example in Fortran is very similar except that the assignment expression in the \code{declare}~\code{reduction} directive can only be used for a single variable, in this case through a type structure constructor \plc{point($\ldots$)}. -\ffreeexample{udr}{2} +\ffreeexample[4.0]{udr}{2} The following example shows the use of special variables in arguments for combiner (\code{omp\_in} and \code{omp\_out}) and initializer (\code{omp\_priv} and \code{omp\_orig}) routines. This example returns the maximum value of an array and the corresponding index value. The \code{declare}~\code{reduction} directive specifies a user-defined reduction operation \plc{maxloc} for data type \plc{struct} \plc{mx\_s}. The function \plc{mx\_combine} is the combiner and the function \plc{mx\_init} is the initializer. -\cexample{udr}{3} +\cexample[4.0]{udr}{3} Below is the corresponding Fortran version of the above example. The \code{declare}~\code{reduction} directive specifies the user-defined operation \plc{maxloc} for user-derived type \plc{mx\_s}. The combiner \plc{mx\_combine} and the initializer \plc{mx\_init} are specified as subprograms. -\ffreeexample{udr}{3} +\ffreeexample[4.0]{udr}{3} The following example explains a few details of the user-defined reduction @@ -74,16 +75,16 @@ has the \code{initializer} clause, the subroutine specified on the clause must be accessible in the current scoping unit. In this case, the subroutine \plc{dt\_init} is accessible by use association. -\ffreeexample{udr}{4} +\ffreeexample[4.0]{udr}{4} The following example uses user-defined reductions to declare a plus (+) reduction for a C++ class. As the \code{declare}~\code{reduction} directive is inside the context of the \plc{V} class the expressions in the \code{declare}~\code{reduction} directive are resolved in the context of the class. Also, note that the \code{initializer} clause uses a copy constructor to initialize the private variables of the reduction and it uses as parameter to its original variable by using the special variable \code{omp\_orig}. -\cppexample{udr}{5} +\cppexample[4.0]{udr}{5} The following examples shows how user-defined reductions can be defined for some STL containers. The first \code{declare}~\code{reduction} defines the plus (+) operation for \plc{std::vector} by making use of the \plc{std::transform} algorithm. The second and third define the merge (or concatenation) operation for \plc{std::vector} and \plc{std::list}. %It shows how the same user-defined reduction operation can be defined to be done differently depending on the specified data type. It shows how the user-defined reduction operation can be applied to specific data types of an STL. -\cppexample{udr}{6} +\cppexample[4.0]{udr}{6} diff --git a/Examples_variant.tex b/Examples_variant.tex index 24e2249..004f6bb 100644 --- a/Examples_variant.tex +++ b/Examples_variant.tex @@ -46,9 +46,9 @@ the purpose of a function variant is to produce the same results by a different %\code{teams distribute simd} in the variant function would produce non conforming code. %\pagebreak -\cexample{declare_variant}{1} +\cexample[5.0]{declare_variant}{1} -\ffreeexample{declare_variant}{1} +\ffreeexample[5.0]{declare_variant}{1} %\pagebreak @@ -72,6 +72,6 @@ containing only a basic \code{parallel}~\code{for} construct is used for the cal %can be found in the allocator example of the Memory Management Chapter. %\pagebreak -\cexample{declare_variant}{2} +\cexample[5.0]{declare_variant}{2} -\ffreeexample{declare_variant}{2} +\ffreeexample[5.0]{declare_variant}{2} diff --git a/Foreword_Chapt.tex b/Foreword_Chapt.tex index 14e1d46..00b452a 100644 --- a/Foreword_Chapt.tex +++ b/Foreword_Chapt.tex @@ -5,11 +5,11 @@ The OpenMP Examples document has been updated with new features found in the OpenMP 5.0 Specification. The additional examples and updates -are referenced in the Document Revision History of the Appendix, \specref{sec:history_45_to_50}. +are referenced in the Document Revision History of the Appendix on page~\pageref{chap:history}. Text describing an example with a 5.0 feature specifically states that the feature support begins in the OpenMP 5.0 Specification. Also, -an \plc{omp\_5.0} keyword has been added to metadata in the source code. +an \code{\small omp\_5.0} keyword has been added to metadata in the source code. These distinctions are presented to remind readers that a 5.0 compliant OpenMP implementation is necessary to use these features in codes. diff --git a/History.tex b/History.tex index 665a42e..2787a36 100644 --- a/History.tex +++ b/History.tex @@ -1,6 +1,46 @@ \chapter{Document Revision History} \label{chap:history} +\section{Changes from 5.0.0 to 5.0.1} +\label{sec:history_50_to_501} + +\begin{itemize} +\item Added version tags (\code{\small{}omp\_}\plc{x.y}) in example labels +and the corresponding source codes for all examples that feature +OpenMP 3.0 and later. + +\item Included additional examples for the 5.0 features: + +\begin{itemize} +\item Extension to the \code{defaultmap} clause +(\specref{sec:defaultmap}) +\item Transferring noncontiguous data with the \code{target}~\code{update} directive in Fortran (\specref{sec:array-shaping}) +\item \code{conditional} modifier for the \code{lastprivate} clause (\specref{sec:lastprivate}) +\item \code{task} modifier for the \code{reduction} clause (\specref{subsec:task_reduction}) +\item Reduction on combined target constructs (\specref{subsec:target_reduction}) +\item Task reduction with target constructs + (\specref{subsec:target_task_reduction}) +\item \code{scan} directive for returning the \emph{prefix sum} of a reduction (\specref{sec:scan}) + +\end{itemize} + +\item Included additional examples for the 4.x features: + +\begin{itemize} +\item Dependence for undeferred tasks +(\specref{subsec:depend_undefer_task}) +\item \code{ref}, \code{val}, \code{uval} modifiers for \code{linear} clause (\specref{sec:linear_modifier}) + +\end{itemize} + +\item Clarified the description of pointer mapping and pointer attachment in +\specref{sec:pointer_mapping}. +\item Clarified the description of memory model examples +in \specref{sec:mem_model}. + +\end{itemize} + + \section{Changes from 4.5.0 to 5.0.0} \label{sec:history_45_to_50} @@ -21,6 +61,8 @@ \item Combined constructs: \code{parallel}~\code{master}~\code{taskloop} and \code{parallel}~\code{master}~\code{taskloop}~\code{simd} (\specref{sec:parallel_master_taskloop}) \item Reverse Offload through \plc{ancestor} modifier of \code{device} clause. (\specref{subsec:target_reverse_offload}) +\item Pointer Mapping - behavior of mapped pointers (\specref{sec:pointer_mapping}) %Example_target_ptr_map* +\item Structure Mapping - behavior of mapped structures (\specref{sec:structure_mapping}) %Examples_target_structure_mapping.tex target_struct_map* \item Array Shaping with the \plc{shape-operator} (\specref{sec:array-shaping}) \item The \code{declare}~\code{mapper} construct (\specref{sec:declare_mapper}) \item Acquire and Release Semantics Synchronization: Memory ordering @@ -36,12 +78,16 @@ \item \code{requires} directive specifies required features of implementation (\specref{sec:requires}) \item \code{declare}~\code{variant} directive - for function variants (\specref{sec:declare_variant}) \item \code{metadirective} directive - for directive variants (\specref{sec:metadirective}) +\item \code{OMP\_TARGET\_OFFLOAD} Environment Variable - controls offload behavior (\specref{sec:target_offload}) \end{itemize} \item Included the following additional examples for the 4.x features: \begin{itemize} \item more taskloop examples (\specref{sec:taskloop}) \item user-defined reduction (UDR) (\specref{subsec:UDR}) +%NEW 5.0 +%\item \code{target} \code{enter} and \code{exit} \code{data} unstructured data constructs (\specref{sec:target_enter_exit_data}) %Example_target_unstructured_data.* ? + \end{itemize} \end{itemize} @@ -101,12 +147,12 @@ Added the following new examples: \begin{itemize} \item task dependences (\specref{sec:task_depend}) \item \code{target} construct (\specref{sec:target}) +\item array sections in device constructs (\specref{sec:array_sections}) \item \code{target}~\code{data} construct (\specref{sec:target_data}) \item \code{target}~\code{update} construct (\specref{sec:target_update}) \item \code{declare}~\code{target} construct (\specref{sec:declare_target}) \item \code{teams} constructs (\specref{sec:teams}) \item asynchronous execution of a \code{target} region using tasks (\specref{subsec:async_target_with_tasks}) -\item array sections in device constructs (\specref{sec:array_sections}) \item device runtime routines (\specref{sec:device}) \item Fortran ASSOCIATE construct (\specref{sec:associate}) \item cancellation constructs (\specref{sec:cancellation}) diff --git a/Makefile b/Makefile index 12530b3..a5522ff 100644 --- a/Makefile +++ b/Makefile @@ -1,8 +1,9 @@ # Makefile for the OpenMP Examples document in LaTex format. # For more information, see the master document, openmp-examples.tex. -version=5.0.0 +version=5.0.1 default: openmp-examples.pdf +diff: openmp-diff-abridged.pdf CHAPTERS=Title_Page.tex \ @@ -25,6 +26,9 @@ INTERMEDIATE_FILES=openmp-examples.pdf \ openmp-examples.out \ openmp-examples.log +# check for branches names with "name_XXX" +DIFF_TICKET_ID=$(shell git rev-parse --abbrev-ref HEAD) + openmp-examples.pdf: $(CHAPTERS) $(SOURCES) openmp.sty openmp-examples.tex openmp-logo.png rm -f $(INTERMEDIATE_FILES) pdflatex -interaction=batchmode -file-line-error openmp-examples.tex @@ -34,4 +38,46 @@ openmp-examples.pdf: $(CHAPTERS) $(SOURCES) openmp.sty openmp-examples.tex openm clean: rm -f $(INTERMEDIATE_FILES) + rm -f openmp-diff-full.pdf openmp-diff-abridged.pdf + rm -rf *.tmpdir +ifdef DIFF_TO + VC_DIFF_TO := -r ${DIFF_TO} +else + VC_DIFF_TO := +endif +ifdef DIFF_FROM + VC_DIFF_FROM := -r ${DIFF_FROM} +else + VC_DIFF_FROM := -r master +endif + +DIFF_TO:=HEAD +DIFF_FROM:=master +DIFF_TYPE:=UNDERLINE + +COMMON_DIFF_OPTS:=--math-markup=whole \ + --append-safecmd=plc,code,hcode,scode,pcode,splc \ + --append-textcmd=subsubsubsection + +VC_DIFF_OPTS:=${COMMON_DIFF_OPTS} --force -c latexdiff.cfg --flatten --type="${DIFF_TYPE}" --git --pdf ${VC_DIFF_FROM} ${VC_DIFF_TO} --subtype=ZLABEL --graphics-markup=none + +VC_DIFF_MINIMAL_OPTS:= --only-changes --force + +%.tmpdir: $(wildcard *.sty) $(wildcard *.png) $(wildcard *.aux) openmp-examples.pdf + mkdir -p $@/sources + mkdir -p $@/figs + cp -f $^ "$@/" + cp -f sources/* "$@/sources" + cp -f figs/* "$@/figs" + +openmp-diff-abridged.pdf: diff-fast-minimal.tmpdir openmp-examples.pdf + env PATH="$(shell pwd)/util/latexdiff:$(PATH)" latexdiff-vc ${VC_DIFF_MINIMAL_OPTS} --fast -d $< ${VC_DIFF_OPTS} openmp-examples.tex + cp $ "name" is the name of an example "type" is the source code type, which can be translated into or from @@ -43,20 +44,27 @@ For copyright information, please see omp_copyright.txt. "rt-error" is for a case where compilation may be successful, but the code contains potential runtime issues (such as race condition). Alternative would be to just use "conforming" or "non-conforming". + "version" indicates features for a specific OpenMP version, such as "omp_5.0" 3) LaTeX macros for examples - Source code with language h-rules - \cexample{}{} % for C/C++ examples - \cppexample{}{} % for C++ examples - \fexample{}{} % for fixed-form Fortran examples - \ffreeexample{}{} % for free-form Fortran examples + \cexample[]{}{} % for C/C++ examples + \cppexample[]{}{} % for C++ examples + \fexample[]{}{} % for fixed-form Fortran examples + \ffreeexample[]{}{} % for free-form Fortran examples - Source code without language h-rules - \cnexample{}{} - \cppnexample{}{} - \fnexample{}{} - \ffreenexample{}{} + \cnexample[]{}{} + \cppnexample[]{}{} + \fnexample[]{}{} + \ffreenexample[]{}{} + + Optional can be supplied in a macro to include a specific OpenMP + version in the example header. This option also suggests one additional + tag (@@version) line is included in the corresponding source code. + If this is not the case (i.e., no @@version tag line), one needs to + prefix with an underscore '_' symbol in the macro. - Language h-rules \cspecificstart, \cspecificend diff --git a/Title_Page.tex b/Title_Page.tex index 13e69aa..0520fce 100644 --- a/Title_Page.tex +++ b/Title_Page.tex @@ -27,7 +27,7 @@ Source codes for OpenMP \PVER{} Examples can be downloaded from \href{https://github.com/OpenMP/Examples/tree/v\VER}{github}.\\ \begin{adjustwidth}{0pt}{1em}\setlength{\parskip}{0.25\baselineskip}% -Copyright © 1997-2019 OpenMP Architecture Review Board.\\ +Copyright © 1997-2020 OpenMP Architecture Review Board.\\ Permission to copy without fee all or part of this material is granted, provided the OpenMP Architecture Review Board copyright notice and the title of this document appear. Notice is given that copying is by diff --git a/latexdiff.cfg b/latexdiff.cfg new file mode 100644 index 0000000..8ee1064 --- /dev/null +++ b/latexdiff.cfg @@ -0,0 +1,5 @@ +PICTUREENV=(?:picture|DIFnomarkup)[\w\d*@]* +VERBATIMLINEENV=(?:boxedcode|omptCallback|omptRecord|omptInquiry|omptEnum|omptOther|ompcPragma|ompfPragma|ompfSyntax|ompfFunction|ompfSubroutine|ompcEnum|ompcFunction|ompfEnum|ompEnv|ompSyntax|indentedcodelist|codepar) +COUNTERCMD=subsubsubsection +CUSTOMDIFCMD=(?:binding|comments|constraints|crossreferences|descr|argdesc|effect|format|restrictions|summary|syntax|events|tools|record|glossaryterm) +FLOATENV=(?:note|(?:c|cpp|ccpp|c90|c99|fortran)specific) diff --git a/openmp-example.tex b/openmp-example.tex index acd49a7..c795675 100644 --- a/openmp-example.tex +++ b/openmp-example.tex @@ -48,9 +48,9 @@ \documentclass[10pt,letterpaper,twoside,makeidx,hidelinks]{scrreprt} % Text to appear in the footer on even-numbered pages: -\newcommand{\VER}{5.0.0} +\newcommand{\VER}{5.0.1} \newcommand{\PVER}{\VER{}p1} -\newcommand{\VERDATE}{February 2018} +\newcommand{\VERDATE}{May 2020} \newcommand{\footerText}{OpenMP Examples Version \PVER{} - \VERDATE} % Unified style sheet for OpenMP documents: diff --git a/openmp-examples.tex b/openmp-examples.tex index dc7f8ef..686e7d1 100644 --- a/openmp-examples.tex +++ b/openmp-examples.tex @@ -49,9 +49,9 @@ \documentclass[10pt,letterpaper,twoside,makeidx,hidelinks]{scrreprt} % Text to appear in the footer on even-numbered pages: -\newcommand{\VER}{5.0.0} +\newcommand{\VER}{5.0.1} \newcommand{\PVER}{\VER{}} -\newcommand{\VERDATE}{November 2019} +\newcommand{\VERDATE}{June 2020} \newcommand{\footerText}{OpenMP Examples Version \PVER{} - \VERDATE} % Unified style sheet for OpenMP documents: @@ -119,6 +119,7 @@ \input{Chap_devices} \input{Examples_target} + \input{Examples_target_defaultmap} \input{Examples_target_pointer_mapping} \input{Examples_target_structure_mapping} \input{Examples_array_sections} @@ -146,6 +147,8 @@ % Forward Depend 370 % simdlen 476 % simd linear modifier 480 + \input{Examples_linear_modifier} + \input{Chap_synchronization} \input{Examples_critical} @@ -182,6 +185,7 @@ \input{Examples_reduction} % User UDR 287 \input{Examples_udr} + \input{Examples_scan} \input{Examples_copyin} \input{Examples_copyprivate} \input{Examples_cpp_reference} diff --git a/openmp.sty b/openmp.sty index e21f365..7bf1fa8 100644 --- a/openmp.sty +++ b/openmp.sty @@ -417,10 +417,10 @@ %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% % Code example formatting for the Examples document % This defines: -% /cexample formats blue markers, caption, and code for C examples -% /cppexample formats blue markers, caption, and code for C++ examples -% /fexample formats blue markers, caption, and code for Fortran (fixed) examples -% /ffreeexample formats blue markers, caption, and code for Fortran90 (free) examples +% \cexample formats blue markers, caption, and code for C examples +% \cppexample formats blue markers, caption, and code for C++ examples +% \fexample formats blue markers, caption, and code for Fortran (fixed) examples +% \ffreeexample formats blue markers, caption, and code for Fortran90 (free) examples % Thanks to Jin, Haoqiang H. for the original definitions of the following: \usepackage{color,fancyvrb} % for \VerbatimInput @@ -437,7 +437,7 @@ \newcommand{\escstr}[1]{\myreplace{_}{\_}{#1}} -\def\exampleheader#1#2#3#4{% +\def\exampleheader#1#2#3#4#5{% \ifthenelse{ \equal{#1}{} }{ \def\cname{#2} \def\ename\cname @@ -448,52 +448,61 @@ % Use following for mneumonics \def\ename{\escstr{#1}.#2.#3} } + \newcount\cnt + \cnt=#4 + \ifthenelse{ \equal{#5}{} }{ + \def\vername{} + }{ + \def\myver##1{\toolboxSplitAt{##1}{_}\lefttext\righttext + \lefttext\toolboxIfElse{\ifx\righttext\undefined}% + {\global\advance\cnt by 1}{\expandafter{\righttext}}} + \def\vername{\;\;(\code{\small{}omp\_\myver{#5}})} + } \noindent - \textit{Example \ename} + \textit{Example \ename}\vername + \def\fcnt{\the\cnt} %\vspace*{-3mm} - \code{\VerbatimInput[numbers=left,numbersep=5ex,firstnumber=1,firstline=#4,fontsize=\small]% - %\code{\VerbatimInput[numbers=left,firstnumber=1,firstline=#4,fontsize=\small]% - %\code{\VerbatimInput[firstline=#4,fontsize=\small]% + \code{\VerbatimInput[numbers=left,numbersep=5ex,firstnumber=1,firstline=\fcnt,fontsize=\small]% {sources/Example_\cname}} } -\def\cnexample#1#2{% - \exampleheader{#1}{#2}{c}{8} +\newcommand\cnexample[3][]{% + \exampleheader{#2}{#3}{c}{8}{#1} } -\def\cppnexample#1#2{% - \exampleheader{#1}{#2}{cpp}{8} +\newcommand\cppnexample[3][]{% + \exampleheader{#2}{#3}{cpp}{8}{#1} } -\def\fnexample#1#2{% - \exampleheader{#1}{#2}{f}{6} +\newcommand\fnexample[3][]{% + \exampleheader{#2}{#3}{f}{6}{#1} } -\def\ffreenexample#1#2{% - \exampleheader{#1}{#2}{f90}{6} +\newcommand\ffreenexample[3][]{% + \exampleheader{#2}{#3}{f90}{6}{#1} } -\newcommand\cexample[2]{% +\newcommand\cexample[3][]{% \needspace{5\baselineskip}\ccppspecificstart -\cnexample{#1}{#2} +\cnexample[#1]{#2}{#3} \ccppspecificend } -\newcommand\cppexample[2]{% +\newcommand\cppexample[3][]{% \needspace{5\baselineskip}\cppspecificstart -\cppnexample{#1}{#2} +\cppnexample[#1]{#2}{#3} \cppspecificend } -\newcommand\fexample[2]{% +\newcommand\fexample[3][]{% \needspace{5\baselineskip}\fortranspecificstart -\fnexample{#1}{#2} +\fnexample[#1]{#2}{#3} \fortranspecificend } -\newcommand\ffreeexample[2]{% +\newcommand\ffreeexample[3][]{% \needspace{5\baselineskip}\fortranspecificstart -\ffreenexample{#1}{#2} +\ffreenexample[#1]{#2}{#3} \fortranspecificend } diff --git a/sources/Example_SIMD.1.c b/sources/Example_SIMD.1.c index 64a06f9..948b198 100644 --- a/sources/Example_SIMD.1.c +++ b/sources/Example_SIMD.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ void star( double *a, double *b, double *c, int n, int *ioff ) { diff --git a/sources/Example_SIMD.1.f90 b/sources/Example_SIMD.1.f90 index 5d4073a..cdeecbc 100644 --- a/sources/Example_SIMD.1.f90 +++ b/sources/Example_SIMD.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine star(a,b,c,n,ioff_ptr) implicit none double precision :: a(*),b(*),c(*) diff --git a/sources/Example_SIMD.2.c b/sources/Example_SIMD.2.c index d42014c..8fcf9bc 100644 --- a/sources/Example_SIMD.2.c +++ b/sources/Example_SIMD.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include diff --git a/sources/Example_SIMD.2.f90 b/sources/Example_SIMD.2.f90 index 1ce20d7..b9a7993 100644 --- a/sources/Example_SIMD.2.f90 +++ b/sources/Example_SIMD.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program main implicit none integer, parameter :: N=32 @@ -19,15 +20,15 @@ program main end program function add1(a,b,fact) result(c) -!$omp declare simd(add1) uniform(fact) implicit none +!$omp declare simd(add1) uniform(fact) double precision :: a,b,fact, c c = a + b + fact end function function add2(a,b,i, fact) result(c) -!$omp declare simd(add2) uniform(a,b,fact) linear(i:1) implicit none +!$omp declare simd(add2) uniform(a,b,fact) linear(i:1) integer :: i double precision :: a(*),b(*),fact, c c = a(i) + b(i) + fact diff --git a/sources/Example_SIMD.3.c b/sources/Example_SIMD.3.c index 47fa8b0..3c733e8 100644 --- a/sources/Example_SIMD.3.c +++ b/sources/Example_SIMD.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ double work( double *a, double *b, int n ) { diff --git a/sources/Example_SIMD.3.f90 b/sources/Example_SIMD.3.f90 index 42ecace..7f5fa41 100644 --- a/sources/Example_SIMD.3.f90 +++ b/sources/Example_SIMD.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine work( a, b, n, sum ) implicit none integer :: i, n diff --git a/sources/Example_SIMD.4.c b/sources/Example_SIMD.4.c index de0dc69..af35c75 100644 --- a/sources/Example_SIMD.4.c +++ b/sources/Example_SIMD.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ void work( float *b, int n, int m ) { diff --git a/sources/Example_SIMD.4.f90 b/sources/Example_SIMD.4.f90 index 7590519..d01fa56 100644 --- a/sources/Example_SIMD.4.f90 +++ b/sources/Example_SIMD.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine work( b, n, m ) implicit none real :: b(n) diff --git a/sources/Example_SIMD.5.c b/sources/Example_SIMD.5.c index 6d630d8..aa38ee3 100644 --- a/sources/Example_SIMD.5.c +++ b/sources/Example_SIMD.5.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ void work( double **a, double **b, double **c, int n ) { diff --git a/sources/Example_SIMD.5.f90 b/sources/Example_SIMD.5.f90 index e66b716..cd8053b 100644 --- a/sources/Example_SIMD.5.f90 +++ b/sources/Example_SIMD.5.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine work( a, b, c, n ) implicit none integer :: i,j,n diff --git a/sources/Example_SIMD.6.c b/sources/Example_SIMD.6.c index 33498f5..1433a24 100644 --- a/sources/Example_SIMD.6.c +++ b/sources/Example_SIMD.6.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #pragma omp declare simd linear(p:1) notinbranch int foo(int *p){ diff --git a/sources/Example_SIMD.6.f90 b/sources/Example_SIMD.6.f90 index 4a4cd05..9ce9ea4 100644 --- a/sources/Example_SIMD.6.f90 +++ b/sources/Example_SIMD.6.f90 @@ -3,9 +3,10 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 function foo(p) result(r) -!$omp declare simd(foo) notinbranch implicit none +!$omp declare simd(foo) notinbranch integer :: p, r p = p + 10 r = p @@ -26,8 +27,8 @@ function myaddint(a, b, n) result(r) end function myaddint function goo(p) result(r) -!$omp declare simd(goo) inbranch implicit none +!$omp declare simd(goo) inbranch real :: p, r p = p + 18.5 r = p diff --git a/sources/Example_SIMD.7.c b/sources/Example_SIMD.7.c index 1d76cf7..64d96b4 100644 --- a/sources/Example_SIMD.7.c +++ b/sources/Example_SIMD.7.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/Example_SIMD.7.f90 b/sources/Example_SIMD.7.f90 index 1015741..86786a8 100644 --- a/sources/Example_SIMD.7.f90 +++ b/sources/Example_SIMD.7.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program fibonacci implicit none integer,parameter :: N=45 @@ -25,8 +26,8 @@ program fibonacci end program recursive function fib(n) result(r) -!$omp declare simd(fib) inbranch implicit none +!$omp declare simd(fib) inbranch integer :: n, r if (n <= 1) then diff --git a/sources/Example_SIMD.8.c b/sources/Example_SIMD.8.c index 7b93930..d873ea5 100644 --- a/sources/Example_SIMD.8.c +++ b/sources/Example_SIMD.8.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/Example_SIMD.8.f90 b/sources/Example_SIMD.8.f90 index 885d811..c0ff60e 100644 --- a/sources/Example_SIMD.8.f90 +++ b/sources/Example_SIMD.8.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 module work integer :: P(1000) diff --git a/sources/Example_acquire_release.1.c b/sources/Example_acquire_release.1.c index dd8e6af..d7e1078 100644 --- a/sources/Example_acquire_release.1.c +++ b/sources/Example_acquire_release.1.c @@ -1,9 +1,10 @@ /* * @@name: acquire_release.1.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_acquire_release.1.f90 b/sources/Example_acquire_release.1.f90 index 568fc24..0b617bc 100644 --- a/sources/Example_acquire_release.1.f90 +++ b/sources/Example_acquire_release.1.f90 @@ -1,8 +1,9 @@ ! @@name: acquire_release.1.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program rel_acq_ex1 use omp_lib diff --git a/sources/Example_acquire_release.2.c b/sources/Example_acquire_release.2.c index 2dae839..2feedbb 100644 --- a/sources/Example_acquire_release.2.c +++ b/sources/Example_acquire_release.2.c @@ -1,9 +1,10 @@ /* * @@name: acquire_release.2.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_acquire_release.2.f90 b/sources/Example_acquire_release.2.f90 index 38a2f9d..ed15571 100644 --- a/sources/Example_acquire_release.2.f90 +++ b/sources/Example_acquire_release.2.f90 @@ -1,8 +1,9 @@ ! @@name: acquire_release.2.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program rel_acq_ex2 use omp_lib diff --git a/sources/Example_acquire_release.3.c b/sources/Example_acquire_release.3.c index b3f0793..be059ab 100644 --- a/sources/Example_acquire_release.3.c +++ b/sources/Example_acquire_release.3.c @@ -1,9 +1,10 @@ /* * @@name: acquire_release.3.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_acquire_release.3.f90 b/sources/Example_acquire_release.3.f90 index 9caa292..c0fe494 100644 --- a/sources/Example_acquire_release.3.f90 +++ b/sources/Example_acquire_release.3.f90 @@ -1,8 +1,9 @@ ! @@name: acquire_release.3.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program rel_acq_ex3 use omp_lib diff --git a/sources/Example_acquire_release_broke.4.c b/sources/Example_acquire_release_broke.4.c index 0ecc2b6..b058ee7 100644 --- a/sources/Example_acquire_release_broke.4.c +++ b/sources/Example_acquire_release_broke.4.c @@ -1,9 +1,10 @@ /* * @@name: acquire_release.4.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_acquire_release_broke.4.f90 b/sources/Example_acquire_release_broke.4.f90 index b1c677f..3c17aa7 100644 --- a/sources/Example_acquire_release_broke.4.f90 +++ b/sources/Example_acquire_release_broke.4.f90 @@ -1,8 +1,9 @@ ! @@name: acquire_release.4.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program rel_acq_ex4 use omp_lib @@ -13,7 +14,7 @@ program rel_acq_ex4 !! !!! THIS CODE WILL FAIL TO PRODUCE CONSISTENT RESULTS !!!!!!! !! !!! DO NOT PROGRAM SYNCHRONIZATION THIS WAY !!!!!!! - !$omp parallel num_threads private(thrd) private(tmp) + !$omp parallel num_threads(2) private(thrd) private(tmp) thrd = omp_get_thread_num() if (thrd == 0) then !$omp critical diff --git a/sources/Example_affinity.1.c b/sources/Example_affinity.1.c index 5e85909..dfb7e68 100644 --- a/sources/Example_affinity.1.c +++ b/sources/Example_affinity.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ void work(); diff --git a/sources/Example_affinity.1.f b/sources/Example_affinity.1.f index dbed9e4..3f37bbf 100644 --- a/sources/Example_affinity.1.f +++ b/sources/Example_affinity.1.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 PROGRAM EXAMPLE !$OMP PARALLEL PROC_BIND(SPREAD) NUM_THREADS(4) CALL WORK() diff --git a/sources/Example_affinity.2.c b/sources/Example_affinity.2.c index 76445a5..7c75ba5 100644 --- a/sources/Example_affinity.2.c +++ b/sources/Example_affinity.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ void work(); void foo() diff --git a/sources/Example_affinity.2.f90 b/sources/Example_affinity.2.f90 index 322a347..8baf7e8 100644 --- a/sources/Example_affinity.2.f90 +++ b/sources/Example_affinity.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine foo !$omp parallel num_threads(16) proc_bind(spread) call work() diff --git a/sources/Example_affinity.3.c b/sources/Example_affinity.3.c index 9167ce1..c35a063 100644 --- a/sources/Example_affinity.3.c +++ b/sources/Example_affinity.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ void work(); int main() diff --git a/sources/Example_affinity.3.f b/sources/Example_affinity.3.f index d07e433..12c8225 100644 --- a/sources/Example_affinity.3.f +++ b/sources/Example_affinity.3.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 PROGRAM EXAMPLE !$OMP PARALLEL PROC_BIND(CLOSE) NUM_THREADS(4) CALL WORK() diff --git a/sources/Example_affinity.4.c b/sources/Example_affinity.4.c index 5c07812..5972414 100644 --- a/sources/Example_affinity.4.c +++ b/sources/Example_affinity.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ void work(); void foo() diff --git a/sources/Example_affinity.4.f90 b/sources/Example_affinity.4.f90 index 3ef63c8..b95002b 100644 --- a/sources/Example_affinity.4.f90 +++ b/sources/Example_affinity.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine foo !$omp parallel num_threads(16) proc_bind(close) call work() diff --git a/sources/Example_affinity.5.c b/sources/Example_affinity.5.c index 921156d..e894689 100644 --- a/sources/Example_affinity.5.c +++ b/sources/Example_affinity.5.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ void work(); int main() diff --git a/sources/Example_affinity.5.f b/sources/Example_affinity.5.f index 417890b..42e82ff 100644 --- a/sources/Example_affinity.5.f +++ b/sources/Example_affinity.5.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 PROGRAM EXAMPLE !$OMP PARALLEL PROC_BIND(MASTER) NUM_THREADS(4) CALL WORK() diff --git a/sources/Example_affinity.6.c b/sources/Example_affinity.6.c index e599505..05f102e 100644 --- a/sources/Example_affinity.6.c +++ b/sources/Example_affinity.6.c @@ -1,9 +1,10 @@ /* * @@name: affinity.1.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_5.0 */ double * alloc_init_B(double *A, int N); diff --git a/sources/Example_affinity.6.f90 b/sources/Example_affinity.6.f90 index 364543c..699d29d 100644 --- a/sources/Example_affinity.6.f90 +++ b/sources/Example_affinity.6.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_5.0 subroutine task_affinity(A, N) diff --git a/sources/Example_affinity_display.1.c b/sources/Example_affinity_display.1.c index 337c092..9e99456 100644 --- a/sources/Example_affinity_display.1.c +++ b/sources/Example_affinity_display.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_affinity_display.1.f90 b/sources/Example_affinity_display.1.f90 index 60519dd..cea3c23 100644 --- a/sources/Example_affinity_display.1.f90 +++ b/sources/Example_affinity_display.1.f90 @@ -1,8 +1,10 @@ ! @@name: affinity_display.1.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 + program affinity_display ! MAX threads = 8, single socket system use omp_lib diff --git a/sources/Example_affinity_display.2.c b/sources/Example_affinity_display.2.c index 5ae2dbe..aa79166 100644 --- a/sources/Example_affinity_display.2.c +++ b/sources/Example_affinity_display.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_affinity_display.2.f90 b/sources/Example_affinity_display.2.f90 index c8e0634..18cdb42 100644 --- a/sources/Example_affinity_display.2.f90 +++ b/sources/Example_affinity_display.2.f90 @@ -1,8 +1,10 @@ ! @@name: affinity_display.2.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 + program affinity_display use omp_lib @@ -43,6 +45,7 @@ program affinity_display end program subroutine socket_work(socket_num, n_thrds) + use omp_lib implicit none integer :: socket_num, n_thrds character(len=0) :: null diff --git a/sources/Example_affinity_display.3.c b/sources/Example_affinity_display.3.c index f4d5765..439a329 100644 --- a/sources/Example_affinity_display.3.c +++ b/sources/Example_affinity_display.3.c @@ -1,9 +1,10 @@ /* * @@name: affinity_display.3.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include // also null is in diff --git a/sources/Example_affinity_display.3.f90 b/sources/Example_affinity_display.3.f90 index a777bcd..46800a4 100644 --- a/sources/Example_affinity_display.3.f90 +++ b/sources/Example_affinity_display.3.f90 @@ -1,8 +1,10 @@ ! @@name: affinity_display.3.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 + program affinity_display use omp_lib implicit none diff --git a/sources/Example_affinity_query.1.c b/sources/Example_affinity_query.1.c index c89af2b..0cbc18a 100644 --- a/sources/Example_affinity_query.1.c +++ b/sources/Example_affinity_query.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ #include #include diff --git a/sources/Example_affinity_query.1.f90 b/sources/Example_affinity_query.1.f90 index cdd08ef..86bcba0 100644 --- a/sources/Example_affinity_query.1.f90 +++ b/sources/Example_affinity_query.1.f90 @@ -3,6 +3,8 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 + subroutine socket_init(socket_num) use omp_lib integer :: socket_num, n_procs diff --git a/sources/Example_allocators.1.c b/sources/Example_allocators.1.c index 86e3128..4c1ce6a 100644 --- a/sources/Example_allocators.1.c +++ b/sources/Example_allocators.1.c @@ -1,9 +1,10 @@ /* * @@name: allocators.1c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_allocators.1.f90 b/sources/Example_allocators.1.f90 index 87abb11..7fe4f4b 100644 --- a/sources/Example_allocators.1.f90 +++ b/sources/Example_allocators.1.f90 @@ -1,8 +1,9 @@ ! @@name: allocators.1f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program main use omp_lib diff --git a/sources/Example_array_sections.1.c b/sources/Example_array_sections.1.c index 1d810b1..e5aa0e4 100644 --- a/sources/Example_array_sections.1.c +++ b/sources/Example_array_sections.1.c @@ -4,6 +4,7 @@ * @@compilable: no * @@linkable: no * @@expect: failure +* @@version: omp_4.0 */ void foo () { diff --git a/sources/Example_array_sections.1.f90 b/sources/Example_array_sections.1.f90 index 49758b6..5a565af 100644 --- a/sources/Example_array_sections.1.f90 +++ b/sources/Example_array_sections.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: no ! @@linkable: no ! @@expect: failure +! @@version: omp_4.0 subroutine foo() integer :: A(30) A = 1 diff --git a/sources/Example_array_sections.2.c b/sources/Example_array_sections.2.c index 09c8822..20239c2 100644 --- a/sources/Example_array_sections.2.c +++ b/sources/Example_array_sections.2.c @@ -4,6 +4,7 @@ * @@compilable: no * @@linkable: no * @@expect: failure +* @@version: omp_4.0 */ void foo () { diff --git a/sources/Example_array_sections.2.f90 b/sources/Example_array_sections.2.f90 index c61d1d3..891a386 100644 --- a/sources/Example_array_sections.2.f90 +++ b/sources/Example_array_sections.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: no ! @@linkable: no ! @@expect: failure +! @@version: omp_4.0 subroutine foo() integer,target :: A(30) integer,pointer :: p(:) diff --git a/sources/Example_array_sections.3.c b/sources/Example_array_sections.3.c index 4486628..a6641c6 100644 --- a/sources/Example_array_sections.3.c +++ b/sources/Example_array_sections.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ void foo () { diff --git a/sources/Example_array_sections.3.f90 b/sources/Example_array_sections.3.f90 index c20d7dd..57bcc2c 100644 --- a/sources/Example_array_sections.3.f90 +++ b/sources/Example_array_sections.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine foo() integer,target :: A(30) integer,pointer :: p(:) diff --git a/sources/Example_array_sections.4.c b/sources/Example_array_sections.4.c index 6d1774e..fb6f4f7 100644 --- a/sources/Example_array_sections.4.c +++ b/sources/Example_array_sections.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ void foo () { diff --git a/sources/Example_array_sections.4.f90 b/sources/Example_array_sections.4.f90 index aa06f1c..e2c0fe9 100644 --- a/sources/Example_array_sections.4.f90 +++ b/sources/Example_array_sections.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine foo() integer,target :: A(30) integer,pointer :: p(:) diff --git a/sources/Example_array_shaping.1.c b/sources/Example_array_shaping.1.c index 88d0dd3..e6eb40d 100644 --- a/sources/Example_array_shaping.1.c +++ b/sources/Example_array_shaping.1.c @@ -1,9 +1,10 @@ /* * @@name: array_shaping.1.c -* @@type: C, omp_5.0 +* @@type: C * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_5.0 */ #pragma omp declare target int do_work(double *a, int nx, int ny); diff --git a/sources/Example_array_shaping.1.f90 b/sources/Example_array_shaping.1.f90 new file mode 100644 index 0000000..0a30422 --- /dev/null +++ b/sources/Example_array_shaping.1.f90 @@ -0,0 +1,60 @@ +! @@name: array_shaping.1.f90 +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +! @@version: omp_5.0 +module m + interface + subroutine do_work(a, nx, ny) + !$omp declare target to(do_work) + integer, intent(in) :: nx, ny + double precision a(0:nx+1,ny) + end subroutine do_work + + subroutine other_work(a, nx, ny) + !$omp declare target to(other_work) + integer, intent(in) :: nx, ny + double precision a(0:nx+1,ny) + end subroutine other_work + + subroutine exch_data(a, nx, ny) + integer, intent(in) :: nx, ny + double precision a(0:nx+1,ny) + end subroutine exch_data + end interface +end module m + +subroutine array_shaping(a, nx, ny) + use m + implicit none + integer, intent(in) :: nx, ny + double precision a(0:nx+1,ny) + + ! map data to device and do work + !$omp target data map(a) + + ! do work on the device + !$omp target ! map(a) is optional here + call do_work(a, nx, ny) + !$omp end target + + ! update boundary points (two rows of 2D array) on the host. + ! data transferred are noncontiguous + !$omp target update from( a(1,1:ny), a(nx,1:ny) ) + + ! exchange ghost points with neighbors + call exch_data(a, nx, ny) + + ! update ghost points (two rows of 2D array) on the device. + ! data transferred are noncontiguous + !$omp target update to( a(0,1:ny), a(nx+1,1:ny) ) + + ! perform other work on the device + !$omp target ! map(a) is optional here + call other_work(a, nx, ny) + !$omp end target + + !$omp end target data + +end subroutine diff --git a/sources/Example_associate.1.f b/sources/Example_associate.1.f index 745dc0b..500db20 100644 --- a/sources/Example_associate.1.f +++ b/sources/Example_associate.1.f @@ -3,7 +3,8 @@ ! @@compilable: no ! @@linkable: no ! @@expect: failure - program example +! @@version: omp_4.0 + program example_broken real :: a, c associate (b => a) !$omp parallel private(b, c) ! invalid to privatize b diff --git a/sources/Example_associate.2.f b/sources/Example_associate.2.f index deea829..c0787c8 100644 --- a/sources/Example_associate.2.f +++ b/sources/Example_associate.2.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example use omp_lib integer i diff --git a/sources/Example_associate.3.f90 b/sources/Example_associate.3.f90 index 2d75291..bd2c209 100644 --- a/sources/Example_associate.3.f90 +++ b/sources/Example_associate.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: v v = 15 diff --git a/sources/Example_async_target.1.c b/sources/Example_async_target.1.c index 89c7770..f9bbf33 100644 --- a/sources/Example_async_target.1.c +++ b/sources/Example_async_target.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #pragma omp declare target float F(float); diff --git a/sources/Example_async_target.1.f90 b/sources/Example_async_target.1.f90 index 3b454d4..e25876a 100644 --- a/sources/Example_async_target.1.f90 +++ b/sources/Example_async_target.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module parameters integer, parameter :: N=1000000000, CHUNKSZ=1000000 end module diff --git a/sources/Example_async_target.2.c b/sources/Example_async_target.2.c index 7b1555f..45aca25 100644 --- a/sources/Example_async_target.2.c +++ b/sources/Example_async_target.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/Example_async_target.2.f90 b/sources/Example_async_target.2.f90 index 40249b4..acc409a 100644 --- a/sources/Example_async_target.2.f90 +++ b/sources/Example_async_target.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine mult(p, N, idev) use omp_lib, ONLY: omp_is_initial_device real :: p(N) diff --git a/sources/Example_async_target.3.c b/sources/Example_async_target.3.c index bc4165a..97157c0 100644 --- a/sources/Example_async_target.3.c +++ b/sources/Example_async_target.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ #include diff --git a/sources/Example_async_target.3.f90 b/sources/Example_async_target.3.f90 index 6d48101..7b2122f 100644 --- a/sources/Example_async_target.3.f90 +++ b/sources/Example_async_target.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 program concurrent_async use omp_lib diff --git a/sources/Example_async_target.4.c b/sources/Example_async_target.4.c index d2ec306..b4843b1 100644 --- a/sources/Example_async_target.4.c +++ b/sources/Example_async_target.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ extern void init( float*, int); diff --git a/sources/Example_async_target.4.f90 b/sources/Example_async_target.4.f90 index 6896617..f258d84 100644 --- a/sources/Example_async_target.4.f90 +++ b/sources/Example_async_target.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 subroutine vec_mult(N) implicit none diff --git a/sources/Example_atomic.1.c b/sources/Example_atomic.1.c index 2bec0f3..e83dcec 100644 --- a/sources/Example_atomic.1.c +++ b/sources/Example_atomic.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_3.1 */ float work1(int i) { diff --git a/sources/Example_atomic.1.f b/sources/Example_atomic.1.f index 74bc5cf..20015a3 100644 --- a/sources/Example_atomic.1.f +++ b/sources/Example_atomic.1.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_3.1 REAL FUNCTION WORK1(I) INTEGER I WORK1 = 1.0 * I diff --git a/sources/Example_atomic.2.c b/sources/Example_atomic.2.c index 3250af5..7f3797e 100644 --- a/sources/Example_atomic.2.c +++ b/sources/Example_atomic.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.1 */ int atomic_read(const int *p) { diff --git a/sources/Example_atomic.2.f b/sources/Example_atomic.2.f index 490d1bb..4e5dfab 100644 --- a/sources/Example_atomic.2.f +++ b/sources/Example_atomic.2.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.1 function atomic_read(p) integer :: atomic_read integer, intent(in) :: p diff --git a/sources/Example_atomic.3.c b/sources/Example_atomic.3.c index f85a6ad..8cf0a6b 100644 --- a/sources/Example_atomic.3.c +++ b/sources/Example_atomic.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.1 */ int fetch_and_add(int *p) { diff --git a/sources/Example_atomic.3.f b/sources/Example_atomic.3.f index d71941d..c805923 100644 --- a/sources/Example_atomic.3.f +++ b/sources/Example_atomic.3.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.1 function fetch_and_add(p) integer:: fetch_and_add integer, intent(inout) :: p diff --git a/sources/Example_atomic_restrict.1.c b/sources/Example_atomic_restrict.1.c index 2b66ece..679a8a3 100644 --- a/sources/Example_atomic_restrict.1.c +++ b/sources/Example_atomic_restrict.1.c @@ -4,6 +4,7 @@ * @@compilable: maybe * @@linkable: no * @@expect: failure +* @@version: omp_3.1 */ void atomic_wrong () { diff --git a/sources/Example_atomic_restrict.1.f b/sources/Example_atomic_restrict.1.f index f4f5b45..5f2e28f 100644 --- a/sources/Example_atomic_restrict.1.f +++ b/sources/Example_atomic_restrict.1.f @@ -3,6 +3,7 @@ ! @@compilable: maybe ! @@linkable: no ! @@expect: failure +! @@version: omp_3.1 SUBROUTINE ATOMIC_WRONG() INTEGER:: I REAL:: R diff --git a/sources/Example_atomic_restrict.2.c b/sources/Example_atomic_restrict.2.c index b68b08e..37fcce7 100644 --- a/sources/Example_atomic_restrict.2.c +++ b/sources/Example_atomic_restrict.2.c @@ -4,6 +4,7 @@ * @@compilable: maybe * @@linkable: no * @@expect: failure +* @@version: omp_3.1 */ void atomic_wrong2 () { diff --git a/sources/Example_atomic_restrict.2.f b/sources/Example_atomic_restrict.2.f index 8cf2008..71467c0 100644 --- a/sources/Example_atomic_restrict.2.f +++ b/sources/Example_atomic_restrict.2.f @@ -3,6 +3,7 @@ ! @@compilable: maybe ! @@linkable: no ! @@expect: failure +! @@version: omp_3.1 SUBROUTINE SUB() COMMON /BLK/ R REAL R diff --git a/sources/Example_atomic_restrict.3.f b/sources/Example_atomic_restrict.3.f index e5659cd..7ab0165 100644 --- a/sources/Example_atomic_restrict.3.f +++ b/sources/Example_atomic_restrict.3.f @@ -3,6 +3,7 @@ ! @@compilable: maybe ! @@linkable: no ! @@expect: failure +! @@version: omp_3.1 SUBROUTINE ATOMIC_WRONG3 INTEGER:: I REAL:: R diff --git a/sources/Example_cancellation.1.cpp b/sources/Example_cancellation.1.cpp index 3ef5589..8d99779 100644 --- a/sources/Example_cancellation.1.cpp +++ b/sources/Example_cancellation.1.cpp @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/Example_cancellation.1.f90 b/sources/Example_cancellation.1.f90 index ed94cae..8410b1d 100644 --- a/sources/Example_cancellation.1.f90 +++ b/sources/Example_cancellation.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine example(n, dim) integer, intent(in) :: n, dim(n) integer :: i, s, err diff --git a/sources/Example_cancellation.2.c b/sources/Example_cancellation.2.c index d038029..283ce7c 100644 --- a/sources/Example_cancellation.2.c +++ b/sources/Example_cancellation.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include diff --git a/sources/Example_cancellation.2.f90 b/sources/Example_cancellation.2.f90 index f9132aa..590ed04 100644 --- a/sources/Example_cancellation.2.f90 +++ b/sources/Example_cancellation.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module parallel_search type binary_tree integer :: value diff --git a/sources/Example_collapse.1.c b/sources/Example_collapse.1.c index dcb8810..0478795 100644 --- a/sources/Example_collapse.1.c +++ b/sources/Example_collapse.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ void bar(float *a, int i, int j, int k); diff --git a/sources/Example_collapse.1.f b/sources/Example_collapse.1.f index ca93b6d..47faa16 100644 --- a/sources/Example_collapse.1.f +++ b/sources/Example_collapse.1.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 subroutine sub(a) diff --git a/sources/Example_collapse.2.c b/sources/Example_collapse.2.c index 55f090b..2f63aeb 100644 --- a/sources/Example_collapse.2.c +++ b/sources/Example_collapse.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ #include diff --git a/sources/Example_collapse.2.f b/sources/Example_collapse.2.f index 189f565..1c65f76 100644 --- a/sources/Example_collapse.2.f +++ b/sources/Example_collapse.2.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_3.0 program test !$omp parallel diff --git a/sources/Example_collapse.3.c b/sources/Example_collapse.3.c index 45b5e46..30d5411 100644 --- a/sources/Example_collapse.3.c +++ b/sources/Example_collapse.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ #include #include diff --git a/sources/Example_collapse.3.f b/sources/Example_collapse.3.f index f1339a8..b970ba0 100644 --- a/sources/Example_collapse.3.f +++ b/sources/Example_collapse.3.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 program test include 'omp_lib.h' !$omp parallel num_threads(2) diff --git a/sources/Example_cpp_reference.1.cpp b/sources/Example_cpp_reference.1.cpp index 6a7fc11..5c63ff5 100644 --- a/sources/Example_cpp_reference.1.cpp +++ b/sources/Example_cpp_reference.1.cpp @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ void task_body (int &); diff --git a/sources/Example_critical.2.f b/sources/Example_critical.2.f index ec19a5e..ae4997e 100644 --- a/sources/Example_critical.2.f +++ b/sources/Example_critical.2.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 SUBROUTINE CRITICAL_EXAMPLE(X, Y) USE OMP_LIB ! or INCLUDE "omp_lib.h" diff --git a/sources/Example_declare_target.1.c b/sources/Example_declare_target.1.c index 5a7c980..1e54e91 100644 --- a/sources/Example_declare_target.1.c +++ b/sources/Example_declare_target.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #pragma omp declare target extern void fib(int N); diff --git a/sources/Example_declare_target.1.f90 b/sources/Example_declare_target.1.f90 index ce0cf9c..7c06616 100644 --- a/sources/Example_declare_target.1.f90 +++ b/sources/Example_declare_target.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 module module_fib contains subroutine fib(N) diff --git a/sources/Example_declare_target.2.cpp b/sources/Example_declare_target.2.cpp index f151cd8..9365201 100644 --- a/sources/Example_declare_target.2.cpp +++ b/sources/Example_declare_target.2.cpp @@ -4,6 +4,7 @@ * @@compilable: no * @@linkable: no * @@expect: failure +* @@version: omp_4.0 */ struct typeX { diff --git a/sources/Example_declare_target.2.f90 b/sources/Example_declare_target.2.f90 index 2c95967..061e24a 100644 --- a/sources/Example_declare_target.2.f90 +++ b/sources/Example_declare_target.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program my_fib integer :: N = 8 !$omp declare target(fib) diff --git a/sources/Example_declare_target.3.c b/sources/Example_declare_target.3.c index 31bc938..a9c3027 100644 --- a/sources/Example_declare_target.3.c +++ b/sources/Example_declare_target.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #define N 1000 #pragma omp declare target diff --git a/sources/Example_declare_target.3.f90 b/sources/Example_declare_target.3.f90 index 1598519..5bb96e2 100644 --- a/sources/Example_declare_target.3.f90 +++ b/sources/Example_declare_target.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module my_arrays !$omp declare target (N, p, v1, v2) integer, parameter :: N=1000 diff --git a/sources/Example_declare_target.4.c b/sources/Example_declare_target.4.c index 2a74d6e..16cee20 100644 --- a/sources/Example_declare_target.4.c +++ b/sources/Example_declare_target.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #define N 10000 #pragma omp declare target diff --git a/sources/Example_declare_target.4.f90 b/sources/Example_declare_target.4.f90 index 12ee23e..080da71 100644 --- a/sources/Example_declare_target.4.f90 +++ b/sources/Example_declare_target.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module my_global_array !$omp declare target (N,Q) integer, parameter :: N=10 diff --git a/sources/Example_declare_target.5.c b/sources/Example_declare_target.5.c index 394fa1f..ced21de 100644 --- a/sources/Example_declare_target.5.c +++ b/sources/Example_declare_target.5.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #define N 10000 #define M 1024 diff --git a/sources/Example_declare_target.5.f90 b/sources/Example_declare_target.5.f90 index 0f9809c..62902c3 100644 --- a/sources/Example_declare_target.5.f90 +++ b/sources/Example_declare_target.5.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module my_global_array !$omp declare target (N,Q) integer, parameter :: N=10000, M=1024 diff --git a/sources/Example_declare_target.6.c b/sources/Example_declare_target.6.c index 99b3332..e8b383e 100644 --- a/sources/Example_declare_target.6.c +++ b/sources/Example_declare_target.6.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ #define N 100000000 diff --git a/sources/Example_declare_target.6.f90 b/sources/Example_declare_target.6.f90 index b226527..e702252 100644 --- a/sources/Example_declare_target.6.f90 +++ b/sources/Example_declare_target.6.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 module m_dat integer, parameter :: N=100000000 !$omp declare target link(sp,sv1,sv2) diff --git a/sources/Example_declare_variant.1.c b/sources/Example_declare_variant.1.c index 40d2f08..f7f457e 100644 --- a/sources/Example_declare_variant.1.c +++ b/sources/Example_declare_variant.1.c @@ -1,9 +1,10 @@ /* * @@name: declare_variant.1c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #define N 100 @@ -32,6 +33,7 @@ void t_vxv(int *v1,int *v2,int *v3,int n) // function variant #pragma omp distribute simd for (int i= 0; i< n; i++) v3[i] = v1[i] * v2[i]*2; } +#pragma omp end declare target int main() { diff --git a/sources/Example_declare_variant.1.f90 b/sources/Example_declare_variant.1.f90 index 1cb6aef..06d425f 100644 --- a/sources/Example_declare_variant.1.f90 +++ b/sources/Example_declare_variant.1.f90 @@ -1,8 +1,9 @@ ! @@name: declare_variant.1f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 module subs use omp_lib diff --git a/sources/Example_declare_variant.2.c b/sources/Example_declare_variant.2.c index 6f0ecd6..96533e3 100644 --- a/sources/Example_declare_variant.2.c +++ b/sources/Example_declare_variant.2.c @@ -1,9 +1,10 @@ /* * @@name: declare_variant.2c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_declare_variant.2.f90 b/sources/Example_declare_variant.2.f90 index d15e560..cdf08c8 100644 --- a/sources/Example_declare_variant.2.f90 +++ b/sources/Example_declare_variant.2.f90 @@ -1,8 +1,9 @@ ! @@name: declare_variant.2f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 module subs use omp_lib diff --git a/sources/Example_depobj.1.c b/sources/Example_depobj.1.c index 5230912..bae1031 100644 --- a/sources/Example_depobj.1.c +++ b/sources/Example_depobj.1.c @@ -1,9 +1,10 @@ /* * @@name: depobj.1c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_depobj.1.f90 b/sources/Example_depobj.1.f90 index aa5d6ec..1c03e40 100644 --- a/sources/Example_depobj.1.f90 +++ b/sources/Example_depobj.1.f90 @@ -1,8 +1,10 @@ ! @@name: depobj.1f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 + program main use omp_lib implicit none diff --git a/sources/Example_device.1.c b/sources/Example_device.1.c index f7a637c..3942275 100644 --- a/sources/Example_device.1.c +++ b/sources/Example_device.1.c @@ -4,16 +4,20 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include #include + #pragma omp declare target void vec_mult(float *p, float *v1, float *v2, int N); extern float *p, *v1, *v2; extern int N; #pragma omp end declare target + extern void init_vars(float *, float *, int); extern void output(float *, int); + void foo() { init_vars(v1, v2, N); @@ -23,6 +27,7 @@ void foo() } output(p, N); } + void vec_mult(float *p, float *v1, float *v2, int N) { int i; diff --git a/sources/Example_device.1.f90 b/sources/Example_device.1.f90 index aa90809..6d1e1d4 100644 --- a/sources/Example_device.1.f90 +++ b/sources/Example_device.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 module params integer,parameter :: N=1024 end module params diff --git a/sources/Example_device.2.c b/sources/Example_device.2.c index e3af83c..75cdaa7 100644 --- a/sources/Example_device.2.c +++ b/sources/Example_device.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include extern void init(float *, float *, int); diff --git a/sources/Example_device.2.f90 b/sources/Example_device.2.f90 index 038adb7..72ba85b 100644 --- a/sources/Example_device.2.f90 +++ b/sources/Example_device.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(p, v1, v2, N) use omp_lib, ONLY : omp_get_num_devices real :: p(N), v1(N), v2(N) diff --git a/sources/Example_device.3.c b/sources/Example_device.3.c index 9782334..db85359 100644 --- a/sources/Example_device.3.c +++ b/sources/Example_device.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/Example_device.3.f90 b/sources/Example_device.3.f90 index c9d787a..e94ffe5 100644 --- a/sources/Example_device.3.f90 +++ b/sources/Example_device.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program foo use omp_lib, ONLY : omp_get_default_device, omp_set_default_device integer :: old_default_device, new_default_device diff --git a/sources/Example_device.4.c b/sources/Example_device.4.c index e8a1ea0..eabcc63 100644 --- a/sources/Example_device.4.c +++ b/sources/Example_device.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ #include #include diff --git a/sources/Example_doacross.1.c b/sources/Example_doacross.1.c index e2a7824..3a0ca97 100644 --- a/sources/Example_doacross.1.c +++ b/sources/Example_doacross.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ float foo(int i); float bar(float a, float b); diff --git a/sources/Example_doacross.1.f90 b/sources/Example_doacross.1.f90 index f344905..bce32db 100644 --- a/sources/Example_doacross.1.f90 +++ b/sources/Example_doacross.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 subroutine work( N, A, B, C ) integer :: N, i real, dimension(N) :: A, B, C diff --git a/sources/Example_doacross.2.c b/sources/Example_doacross.2.c index ba9ac9f..f2613fc 100644 --- a/sources/Example_doacross.2.c +++ b/sources/Example_doacross.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ float foo(int i, int j); float bar(float a, float b, float c); diff --git a/sources/Example_doacross.2.f90 b/sources/Example_doacross.2.f90 index d8aa9b6..75aefa0 100644 --- a/sources/Example_doacross.2.f90 +++ b/sources/Example_doacross.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 subroutine work( N, M, A, B, C ) integer :: N, M, i, j real, dimension(M,N) :: A, B, C diff --git a/sources/Example_doacross.3.c b/sources/Example_doacross.3.c index 8abd8ab..8b3bf44 100644 --- a/sources/Example_doacross.3.c +++ b/sources/Example_doacross.3.c @@ -4,6 +4,7 @@ * @@compilable: no * @@linkable: no * @@expect: failure +* @@version: omp_4.5 */ #define N 100 diff --git a/sources/Example_doacross.3.f90 b/sources/Example_doacross.3.f90 index 84ab56d..546a3f9 100644 --- a/sources/Example_doacross.3.f90 +++ b/sources/Example_doacross.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: no ! @@linkable: no ! @@expect: failure +! @@version: omp_4.5 subroutine work_wrong(N, p) integer :: N real(8), dimension(N,N,N) :: p diff --git a/sources/Example_doacross.4.c b/sources/Example_doacross.4.c index 4803c5e..b476c41 100644 --- a/sources/Example_doacross.4.c +++ b/sources/Example_doacross.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ double foo(int i, int j); diff --git a/sources/Example_doacross.4.f90 b/sources/Example_doacross.4.f90 index e39daaf..8040fc3 100644 --- a/sources/Example_doacross.4.f90 +++ b/sources/Example_doacross.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 subroutine work( N, M, A, B, C ) integer :: N, M real(8), dimension(M, N) :: A, B, C diff --git a/sources/Example_doacross.5.c b/sources/Example_doacross.5.c index e2a7824..3a0ca97 100644 --- a/sources/Example_doacross.5.c +++ b/sources/Example_doacross.5.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ float foo(int i); float bar(float a, float b); diff --git a/sources/Example_doacross.5.f90 b/sources/Example_doacross.5.f90 index f344905..bce32db 100644 --- a/sources/Example_doacross.5.f90 +++ b/sources/Example_doacross.5.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 subroutine work( N, A, B, C ) integer :: N, i real, dimension(N) :: A, B, C diff --git a/sources/Example_host_teams.1.c b/sources/Example_host_teams.1.c index d26df9d..4cb5d6d 100644 --- a/sources/Example_host_teams.1.c +++ b/sources/Example_host_teams.1.c @@ -1,9 +1,10 @@ /* * @@name: host_teams.2.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_host_teams.1.f90 b/sources/Example_host_teams.1.f90 index bdc1a3e..0ea5ac0 100644 --- a/sources/Example_host_teams.1.f90 +++ b/sources/Example_host_teams.1.f90 @@ -1,8 +1,9 @@ ! @@name: host_teams.2.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program main use omp_lib diff --git a/sources/Example_init_lock_with_hint.1.cpp b/sources/Example_init_lock_with_hint.1.cpp index d50b62d..1971c14 100644 --- a/sources/Example_init_lock_with_hint.1.cpp +++ b/sources/Example_init_lock_with_hint.1.cpp @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ #include diff --git a/sources/Example_init_lock_with_hint.1.f b/sources/Example_init_lock_with_hint.1.f index b0f8cfe..56603c8 100644 --- a/sources/Example_init_lock_with_hint.1.f +++ b/sources/Example_init_lock_with_hint.1.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 FUNCTION NEW_LOCKS() USE OMP_LIB ! or INCLUDE "omp_lib.h" INTEGER(OMP_LOCK_KIND), DIMENSION(1000) :: NEW_LOCKS diff --git a/sources/Example_lastprivate.2.c b/sources/Example_lastprivate.2.c new file mode 100644 index 0000000..057f9eb --- /dev/null +++ b/sources/Example_lastprivate.2.c @@ -0,0 +1,23 @@ +/* +* @@name: lastprivate.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +* @@version: omp_5.0 +*/ +#include + +float condlastprivate(float *a, int n) +{ + float x = 0.0f; + + #pragma omp parallel for simd lastprivate(conditional: x) + for (int k = 0; k < n; k++) { + if (a[k] < 108.5 || a[k] > 208.5) { + x = sinf(a[k]); + } + } + + return x; +} diff --git a/sources/Example_lastprivate.2.f90 b/sources/Example_lastprivate.2.f90 new file mode 100644 index 0000000..0ec310e --- /dev/null +++ b/sources/Example_lastprivate.2.f90 @@ -0,0 +1,21 @@ +! @@name: lastprivate.2f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +! @@version: omp_5.0 +function condlastprivate(a, n) result(x) + implicit none + real a(*), x + integer n, k + + x = 0.0 + + !$omp parallel do simd lastprivate(conditional: x) + do k = 1, n + if (a(k) < 108.5 .or. a(k) > 208.5) then + x = sin(a(k)) + endif + end do + +end function condlastprivate diff --git a/sources/Example_linear_in_loop.1.c b/sources/Example_linear_in_loop.1.c index f6deeda..7222bab 100644 --- a/sources/Example_linear_in_loop.1.c +++ b/sources/Example_linear_in_loop.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.5 */ #include diff --git a/sources/Example_linear_in_loop.1.f90 b/sources/Example_linear_in_loop.1.f90 index 5edc41d..fad40fc 100644 --- a/sources/Example_linear_in_loop.1.f90 +++ b/sources/Example_linear_in_loop.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.5 program linear_loop implicit none integer, parameter :: N = 100 diff --git a/sources/Example_linear_modifier.1.cpp b/sources/Example_linear_modifier.1.cpp new file mode 100644 index 0000000..dee84da --- /dev/null +++ b/sources/Example_linear_modifier.1.cpp @@ -0,0 +1,45 @@ +/* +* @@name: linear_modifier.1cpp +* @@type: C++ +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_4.5 +*/ +#include + +#define NN 1023 +int a[NN]; + +#pragma omp declare simd linear(ref(p)) simdlen(8) +void add_one2(int& p) +{ + p += 1; +} + +int main(void) +{ + int i; + int* p = a; + + for (i = 0; i < NN; i++) { + a[i] = i; + } + +#pragma omp simd linear(p) simdlen(8) + for (i = 0; i < NN; i++) { + int& k = *p; + add_one2(k); + add_one2(a[i]); + p++; + } + + for (i = 0; i < NN; i++) { + if (a[i] != i+2) { + printf("failed\n"); + return 1; + } + } + printf("passed\n"); + return 0; +} diff --git a/sources/Example_linear_modifier.1.f90 b/sources/Example_linear_modifier.1.f90 new file mode 100644 index 0000000..04fc8c4 --- /dev/null +++ b/sources/Example_linear_modifier.1.f90 @@ -0,0 +1,48 @@ +! @@name: linear_modifier.1.f90 +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_4.5 +module m + integer, parameter :: NN = 1023 + integer :: a(NN) + + contains + subroutine add_one2(p) + !$omp declare simd(add_one2) linear(ref(p)) simdlen(8) + implicit none + integer :: p + + p = p + 1 + end subroutine +end module + +program main + use m + implicit none + integer :: i, p + + do i = 1, NN + a(i) = i + end do + + p = 1 + !$omp simd linear(p) simdlen(8) + do i = 1, NN + associate(k => a(p)) + call add_one2(k) + end associate + call add_one2(a(i)) + p = p + 1 + end do + + do i = 1, NN + if (a(i) /= i+2) then + print *, "failed" + stop + endif + end do + print *, "passed" +end program + diff --git a/sources/Example_linear_modifier.2.cpp b/sources/Example_linear_modifier.2.cpp new file mode 100644 index 0000000..6b66595 --- /dev/null +++ b/sources/Example_linear_modifier.2.cpp @@ -0,0 +1,44 @@ +/* +* @@name: linear_modifier.2cpp +* @@type: C++ +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_4.5 +*/ +#include + +#define NN 1023 +int a[NN]; + +#pragma omp declare simd linear(ref(p)) linear(uval(i)) +void add_one2(int& p, const int& i) +{ + p += i; +} + +int main(void) +{ + int i; + int* p = a; + + for (i = 0; i < NN; i++) { + a[i] = i; + } + + #pragma omp simd linear(p) + for (i = 0; i < NN; i++) { + int& k = *p; + add_one2(k, i); + p++; + } + + for (i = 0; i < NN; i++) { + if (a[i] != i*2) { + printf("failed\n"); + return 1; + } + } + printf("passed\n"); + return 0; +} diff --git a/sources/Example_linear_modifier.2.f90 b/sources/Example_linear_modifier.2.f90 new file mode 100644 index 0000000..911157d --- /dev/null +++ b/sources/Example_linear_modifier.2.f90 @@ -0,0 +1,45 @@ +! @@name: linear_modifier.2f90 +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_4.5 +module m + integer, parameter :: NN = 1023 + integer :: a(NN) + + contains + subroutine add_one2(p, i) + !$omp declare simd(add_one2) linear(ref(p)) linear(uval(i)) + implicit none + integer :: p + integer, intent(in) :: i + + p = p + i + end subroutine +end module + +program main + use m + implicit none + integer :: i, p + + do i = 1, NN + a(i) = i + end do + + p = 1 + !$omp simd linear(p) + do i = 1, NN + call add_one2(a(p), i) + p = p + 1 + end do + + do i = 1, NN + if (a(i) /= i*2) then + print *, "failed" + stop + endif + end do + print *, "passed" +end program diff --git a/sources/Example_linear_modifier.3.c b/sources/Example_linear_modifier.3.c new file mode 100644 index 0000000..186ae76 --- /dev/null +++ b/sources/Example_linear_modifier.3.c @@ -0,0 +1,45 @@ +/* +* @@name: linear_modifier.3c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_4.5 +*/ +#include + +#define N 128 + +#pragma omp declare simd simdlen(4) uniform(x, y) linear(val(i):1) +double func(double x[], double y[], int i) +{ + return (x[i] + y[i]); +} + +int main(void) +{ + double x[N], y[N], z1[N], z2; + int i, k; + + for (i = 0; i < N; i++) { + x[i] = (double)i; + y[i] = (double)i*2; + } + + k = 0; +#pragma omp simd linear(k) + for (i = 0; i < N; i++) { + z1[i] = func(x, y, k); + k++; + } + + for (i = 0; i < N; i++) { + z2 = (double)(i + i*2); + if (z1[i] != z2) { + printf("failed\n"); + return 1; + } + } + printf("passed\n"); + return 0; +} diff --git a/sources/Example_linear_modifier.3.f90 b/sources/Example_linear_modifier.3.f90 new file mode 100644 index 0000000..0ac0679 --- /dev/null +++ b/sources/Example_linear_modifier.3.f90 @@ -0,0 +1,47 @@ +! @@name: linear_modifier.3f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_4.5 +module func_mod +contains + real(8) function func(x, y, i) +!$omp declare simd(func) simdlen(4) uniform(x, y) linear(val(i):1) + implicit none + real(8), intent(in) :: x(*), y(*) + integer, intent(in) :: i + + func = x(i) + y(i) + + end function func +end module func_mod + +program main + use func_mod + implicit none + integer, parameter :: n = 128 + real(8) :: x(n), y(n), z1(n), z2 + integer :: i, k + + do i=1, n + x(i) = real(i, kind=8) + y(i) = real(i*2, kind=8) + enddo + + k = 1 +!$omp simd linear(k) + do i=1, n + z1(i) = func(x, y, k) + k = k + 1 + enddo + + do i=1, n + z2 = real(i+i*2, kind=8) + if (z1(i) /= z2) then + print *, 'failed' + stop + endif + enddo + print *, 'passed' +end program main diff --git a/sources/Example_loop.1.c b/sources/Example_loop.1.c index 4b6dc85..4acbc3b 100644 --- a/sources/Example_loop.1.c +++ b/sources/Example_loop.1.c @@ -1,9 +1,10 @@ /* * @@name: loop.2c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #define N 100 diff --git a/sources/Example_loop.1.f90 b/sources/Example_loop.1.f90 index 23c66e8..97e0953 100644 --- a/sources/Example_loop.1.f90 +++ b/sources/Example_loop.1.f90 @@ -1,14 +1,16 @@ ! @@name: loop.2f90 -! @@type: F-free, omp_5.0 +! @@type: F-free ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 + program main integer, parameter :: N=100 real :: x(N), y(N) real :: a = 2.0e0 - x=[i,i=1,N]; y=1.0e0 !! initialize + x=(/ (i,i=1,N) /); y=1.0e0 !! initialize !$omp parallel !$omp loop diff --git a/sources/Example_mem_model.1.c b/sources/Example_mem_model.1.c index 136f24c..cd5e543 100644 --- a/sources/Example_mem_model.1.c +++ b/sources/Example_mem_model.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: rt-error +* @@version: omp_3.1 */ #include #include @@ -16,20 +17,24 @@ int main(){ { if (omp_get_thread_num() == 0) { + #pragma omp atomic write x = 5; } else { - /* Print 1: the following read of x has a race */ - printf("1: Thread# %d: x = %d\n", omp_get_thread_num(),x ); + int xval; + #pragma omp atomic read + xval = x; + /* Print 1: xval can be 2 or 5 */ + printf("1: Thread# %d: x = %d\n", omp_get_thread_num(), xval); } #pragma omp barrier if (omp_get_thread_num() == 0) { /* Print 2 */ - printf("2: Thread# %d: x = %d\n", omp_get_thread_num(),x ); + printf("2: Thread# %d: x = %d\n", omp_get_thread_num(), x); } else { /* Print 3 */ - printf("3: Thread# %d: x = %d\n", omp_get_thread_num(),x ); + printf("3: Thread# %d: x = %d\n", omp_get_thread_num(), x); } } return 0; diff --git a/sources/Example_mem_model.1.f90 b/sources/Example_mem_model.1.f90 index 8530dcc..435cba9 100644 --- a/sources/Example_mem_model.1.f90 +++ b/sources/Example_mem_model.1.f90 @@ -3,18 +3,22 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: rt-error +! @@version: omp_3.1 PROGRAM MEMMODEL INCLUDE "omp_lib.h" ! or USE OMP_LIB - INTEGER X + INTEGER X, XVAL X = 2 !$OMP PARALLEL NUM_THREADS(2) SHARED(X) IF (OMP_GET_THREAD_NUM() .EQ. 0) THEN + !$OMP ATOMIC WRITE X = 5 ELSE - ! PRINT 1: The following read of x has a race - PRINT *,"1: THREAD# ", OMP_GET_THREAD_NUM(), "X = ", X + !$OMP ATOMIC READ + XVAL = X + ! PRINT 1: XVAL can be 2 or 5 + PRINT *,"1: THREAD# ", OMP_GET_THREAD_NUM(), "X = ", XVAL ENDIF !$OMP BARRIER diff --git a/sources/Example_mem_model.2.c b/sources/Example_mem_model.2.c index 38e49ad..0021c29 100644 --- a/sources/Example_mem_model.2.c +++ b/sources/Example_mem_model.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: rt-error +* @@version: omp_3.1 */ #include #include @@ -12,37 +13,35 @@ int main() int data; int flag=0; #pragma omp parallel num_threads(2) - { - if (omp_get_thread_num()==0) - { - /* Write to the data buffer that will be - read by thread */ - data = 42; - /* Flush data to thread 1 and strictly order - the write to data - relative to the write to the flag */ - #pragma omp flush(flag, data) - /* Set flag to release thread 1 */ - flag = 1; - /* Flush flag to ensure that thread 1 sees - the change */ - #pragma omp flush(flag) - } - else if(omp_get_thread_num()==1) - { - /* Loop until we see the update to the flag */ - #pragma omp flush(flag, data) - while (flag < 1) - { - #pragma omp flush(flag, data) - } - /* Values of flag and data are undefined */ - printf("flag=%d data=%d\n", flag, data); - #pragma omp flush(flag, data) - /* Values data will be 42, value of flag - still undefined */ - printf("flag=%d data=%d\n", flag, data); - } + { + if (omp_get_thread_num()==0) + { + /* Write to the data buffer that will be + * read by thread */ + data = 42; + /* Flush data to thread 1 and strictly order + * the write to data relative to the write to the flag */ + #pragma omp flush(flag, data) + /* Set flag to release thread 1 */ + #pragma omp atomic write + flag = 1; + } + else if(omp_get_thread_num()==1) + { + /* Loop until we see the update to the flag */ + #pragma omp flush(flag, data) + int flag_val = 0; + while (flag_val < 1) + { + #pragma omp atomic read + flag_val = flag; + } + /* Value of flag is 1; value of data is undefined */ + printf("flag=%d data=%d\n", flag, data); + #pragma omp flush(flag, data) + /* Value of flag is 1; value of data is 42 */ + printf("flag=%d data=%d\n", flag, data); + } } return 0; } diff --git a/sources/Example_mem_model.2.f b/sources/Example_mem_model.2.f index a612293..a323551 100644 --- a/sources/Example_mem_model.2.f +++ b/sources/Example_mem_model.2.f @@ -3,36 +3,42 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: rt-error +! @@version: omp_3.1 PROGRAM EXAMPLE INCLUDE "omp_lib.h" ! or USE OMP_LIB INTEGER DATA - INTEGER FLAG + INTEGER FLAG, FLAG_VAL FLAG = 0 - !$OMP PARALLEL NUM_THREADS(2) +!$OMP PARALLEL NUM_THREADS(2) IF(OMP_GET_THREAD_NUM() .EQ. 0) THEN - ! Write to the data buffer that will be read by thread 1 + ! Write to the data buffer that will be read by thread 1 DATA = 42 - ! Flush DATA to thread 1 and strictly order the write to DATA - ! relative to the write to the FLAG - !$OMP FLUSH(FLAG, DATA) - ! Set FLAG to release thread 1 - FLAG = 1; - ! Flush FLAG to ensure that thread 1 sees the change */ - !$OMP FLUSH(FLAG) + + ! Flush DATA to thread 1 and strictly order the write to DATA + ! relative to the write to the FLAG +!$OMP FLUSH(FLAG, DATA) + + ! Set FLAG to release thread 1 +!$OMP ATOMIC WRITE + FLAG = 1 + ELSE IF(OMP_GET_THREAD_NUM() .EQ. 1) THEN - ! Loop until we see the update to the FLAG - !$OMP FLUSH(FLAG, DATA) - DO WHILE(FLAG .LT. 1) - !$OMP FLUSH(FLAG, DATA) + ! Loop until we see the update to the FLAG +!$OMP FLUSH(FLAG, DATA) + FLAG_VAL = 0 + DO WHILE(FLAG_VAL .LT. 1) +!$OMP ATOMIC READ + FLAG_VAL = FLAG ENDDO - ! Values of FLAG and DATA are undefined + ! Value of FLAG is 1; value of DATA is undefined PRINT *, 'FLAG=', FLAG, ' DATA=', DATA - !$OMP FLUSH(FLAG, DATA) - !Values DATA will be 42, value of FLAG still undefined */ +!$OMP FLUSH(FLAG, DATA) + ! Value of FLAG is 1; value of DATA is 42 PRINT *, 'FLAG=', FLAG, ' DATA=', DATA + ENDIF - !$OMP END PARALLEL +!$OMP END PARALLEL END diff --git a/sources/Example_mem_model.3.c b/sources/Example_mem_model.3.c index fe6659f..f5bc444 100644 --- a/sources/Example_mem_model.3.c +++ b/sources/Example_mem_model.3.c @@ -4,9 +4,13 @@ * @@compilable: yes * @@linkable: yes * @@expect: rt-error +* @@version: omp_3.1 */ #include #include + +int data0 = 0, data1 = 0; + int main() { int flag=0; @@ -15,35 +19,44 @@ int main() { if(omp_get_thread_num()==0) { - /* Set flag to release thread 1 */ + data0 = 17; + #pragma omp flush + /* Set flag to release thread 1 */ #pragma omp atomic update flag++; - /* Flush of flag is implied by the atomic directive */ + /* Flush of flag is implied by the atomic directive */ } else if(omp_get_thread_num()==1) { - /* Loop until we see that flag reaches 1*/ - #pragma omp flush(flag) - while(flag < 1) + int flag_val = 0; + /* Loop until we see that flag reaches 1*/ + while(flag_val < 0) { - #pragma omp flush(flag) + #pragma omp atomic read + flag_val = flag; } - printf("Thread 1 awoken\n"); - - /* Set flag to release thread 2 */ + #pragma omp flush(data0) + /* data0 is 17 here */ + printf("Thread 1 awoken (data0 = %d)\n", data0); + data1 = 42; + #pragma omp flush(data1) + /* Set flag to release thread 2 */ #pragma omp atomic update flag++; - /* Flush of flag is implied by the atomic directive */ + /* Flush of flag is implied by the atomic directive */ } else if(omp_get_thread_num()==2) { - /* Loop until we see that flag reaches 2 */ - #pragma omp flush(flag) - while(flag < 2) + int flag_val = 0; + /* Loop until we see that flag reaches 2 */ + while(flag_val < 2) { - #pragma omp flush(flag) + #pragma omp atomic read + flag_val = flag; } - printf("Thread 2 awoken\n"); + #pragma omp flush(data0,data1) + /* there is a data race here; data0 is 17 and data1 is undefined */ + printf("Thread 2 awoken (data0 = %d, data1 = %d)\n", data0, data1); } } return 0; diff --git a/sources/Example_mem_model.3.f b/sources/Example_mem_model.3.f index 12a27e6..9a9a375 100644 --- a/sources/Example_mem_model.3.f +++ b/sources/Example_mem_model.3.f @@ -3,38 +3,57 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: rt-error +! @@version: omp_3.1 PROGRAM EXAMPLE INCLUDE "omp_lib.h" ! or USE OMP_LIB - INTEGER FLAG + INTEGER FLAG, FLAG_VAL + INTEGER DATA0, DATA1 FLAG = 0 - !$OMP PARALLEL NUM_THREADS(3) +!$OMP PARALLEL NUM_THREADS(3) IF(OMP_GET_THREAD_NUM() .EQ. 0) THEN - ! Set flag to release thread 1 - !$OMP ATOMIC UPDATE - FLAG = FLAG + 1 - !Flush of FLAG is implied by the atomic directive + DATA0 = 17 +!$OMP FLUSH + + ! Set flag to release thread 1 +!$OMP ATOMIC UPDATE + FLAG = FLAG + 1 + ! Flush of FLAG is implied by the atomic directive + ELSE IF(OMP_GET_THREAD_NUM() .EQ. 1) THEN - ! Loop until we see that FLAG reaches 1 - !$OMP FLUSH(FLAG) - DO WHILE(FLAG .LT. 1) - !$OMP FLUSH(FLAG) + ! Loop until we see that FLAG reaches 1 +!$OMP FLUSH(FLAG, DATA) + FLAG_VAL = 0 + DO WHILE(FLAG_VAL .LT. 1) +!$OMP ATOMIC READ + FLAG_VAL = FLAG ENDDO +!$OMP FLUSH - PRINT *, 'Thread 1 awoken' + ! DATA0 is 17 here + PRINT *, 'Thread 1 awoken. DATA0 = ', DATA0 + + DATA1 = 42 +!$OMP FLUSH(DATA1) + + ! Set FLAG to release thread 2 +!$OMP ATOMIC UPDATE + FLAG = FLAG + 1 + ! Flush of FLAG is implied by the atomic directive - ! Set FLAG to release thread 2 - !$OMP ATOMIC UPDATE - FLAG = FLAG + 1 - !Flush of FLAG is implied by the atomic directive ELSE IF(OMP_GET_THREAD_NUM() .EQ. 2) THEN - ! Loop until we see that FLAG reaches 2 - !$OMP FLUSH(FLAG) - DO WHILE(FLAG .LT. 2) - !$OMP FLUSH(FLAG) + ! Loop until we see that FLAG reaches 2 + FLAG_VAL = 0 + DO WHILE(FLAG_VAL .LT. 2) +!$OMP ATOMIC READ + FLAG_VAL = FLAG ENDDO +!$OMP FLUSH(DATA0, DATA1) + + ! There is a data race here; data0 is 17 and data1 is undefined + PRINT *, 'Thread 2 awoken. DATA0 = ', DATA0, + & ' and DATA1 = ', DATA1 - PRINT *, 'Thread 2 awoken' ENDIF - !$OMP END PARALLEL +!$OMP END PARALLEL END diff --git a/sources/Example_metadirective.1.c b/sources/Example_metadirective.1.c index db7c9db..c733138 100644 --- a/sources/Example_metadirective.1.c +++ b/sources/Example_metadirective.1.c @@ -1,9 +1,10 @@ /* * @@name: metadirective.1c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #define N 100 diff --git a/sources/Example_metadirective.1.f90 b/sources/Example_metadirective.1.f90 index 2d7d727..8b4fa75 100644 --- a/sources/Example_metadirective.1.f90 +++ b/sources/Example_metadirective.1.f90 @@ -1,8 +1,9 @@ ! @@name: metadirective.2f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program main integer, parameter :: N= 100 @@ -15,6 +16,7 @@ program main !$omp& when( device={arch("nvptx")}: teams loop) & !$omp& default( parallel loop) do i= 1,N; v3(i) = v1(i) * v2(i); enddo - + !$omp end target + print *, v3(1),v3(N) !!output: -1 -10000 end program diff --git a/sources/Example_metadirective.2.c b/sources/Example_metadirective.2.c index 9f55999..174e091 100644 --- a/sources/Example_metadirective.2.c +++ b/sources/Example_metadirective.2.c @@ -1,9 +1,10 @@ /* * @@name: metadirective.2c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_5.0 */ #define N 100 @@ -16,9 +17,9 @@ int main() //Driver { int i,idev; - for (idev=0; idev #include diff --git a/sources/Example_metadirective.3.f90 b/sources/Example_metadirective.3.f90 index 7a4ca01..8d114a5 100644 --- a/sources/Example_metadirective.3.f90 +++ b/sources/Example_metadirective.3.f90 @@ -1,8 +1,9 @@ ! @@name: metadirective.3f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 module params integer, parameter :: N=1000 @@ -39,6 +40,7 @@ program main !$omp target teams map(from: d) call exp_pi_diff(d,my_pi) + !$omp end target teams ! value should be near 1 print*, "d(N) = ",d(N) ! 1.00000000000311 diff --git a/sources/Example_parallel_master_taskloop.1.c b/sources/Example_parallel_master_taskloop.1.c index f96425f..7b2179b 100644 --- a/sources/Example_parallel_master_taskloop.1.c +++ b/sources/Example_parallel_master_taskloop.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_parallel_master_taskloop.1.f90 b/sources/Example_parallel_master_taskloop.1.f90 index 36d53fd..9b704df 100644 --- a/sources/Example_parallel_master_taskloop.1.f90 +++ b/sources/Example_parallel_master_taskloop.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program main diff --git a/sources/Example_pra_iterator.1.cpp b/sources/Example_pra_iterator.1.cpp index 46b8499..569f3b0 100644 --- a/sources/Example_pra_iterator.1.cpp +++ b/sources/Example_pra_iterator.1.cpp @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ #include void iterator_example() diff --git a/sources/Example_reduction.1.c b/sources/Example_reduction.1.c index 45fcf13..4d64017 100644 --- a/sources/Example_reduction.1.c +++ b/sources/Example_reduction.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.1 */ #include void reduction1(float *x, int *y, int n) diff --git a/sources/Example_reduction.7.c b/sources/Example_reduction.7.c index 5a94085..da24bb5 100644 --- a/sources/Example_reduction.7.c +++ b/sources/Example_reduction.7.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ #include diff --git a/sources/Example_requires.1.cpp b/sources/Example_requires.1.cpp index 54a9418..31760e5 100644 --- a/sources/Example_requires.1.cpp +++ b/sources/Example_requires.1.cpp @@ -1,9 +1,10 @@ /* * @@name: requires.1cpp * @@type: C++ -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_requires.1.f90 b/sources/Example_requires.1.f90 index f8044f0..e5ed110 100644 --- a/sources/Example_requires.1.f90 +++ b/sources/Example_requires.1.f90 @@ -1,8 +1,9 @@ ! @@name: requires.1f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 module data !$omp requires unified_shared_memory diff --git a/sources/Example_scan.1.c b/sources/Example_scan.1.c new file mode 100644 index 0000000..e8c2b3a --- /dev/null +++ b/sources/Example_scan.1.c @@ -0,0 +1,33 @@ +/* +* @@name: scan.1.c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +#define N 100 + +int main(void) +{ + int a[N], b[N]; + int x = 0; + + // initialization + for (int k = 0; k < N; k++) + a[k] = k + 1; + + // a[k] is included in the computation of producing results in b[k] + #pragma omp parallel for simd reduction(inscan,+: x) + for (int k = 0; k < N; k++) { + x += a[k]; + #pragma omp scan inclusive(x) + b[k] = x; + } + + printf("x = %d, b[0:3] = %d %d %d\n", x, b[0], b[1], b[2]); + // 5050, 1 3 6 + + return 0; +} diff --git a/sources/Example_scan.1.f90 b/sources/Example_scan.1.f90 new file mode 100644 index 0000000..dd35bfc --- /dev/null +++ b/sources/Example_scan.1.f90 @@ -0,0 +1,30 @@ +! @@name: scan.1.f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_5.0 +program inclusive_scan + implicit none + integer, parameter :: n = 100 + integer a(n), b(n) + integer x, k + + ! initialization + x = 0 + do k = 1, n + a(k) = k + end do + + ! a(k) is included in the computation of producing results in b(k) + !$omp parallel do simd reduction(inscan,+: x) + do k = 1, n + x = x + a(k) + !$omp scan inclusive(x) + b(k) = x + end do + + print *,'x =', x, ', b(1:3) =', b(1:3) + ! 5050, 1 3 6 + +end program diff --git a/sources/Example_scan.2.c b/sources/Example_scan.2.c new file mode 100644 index 0000000..7ac21f6 --- /dev/null +++ b/sources/Example_scan.2.c @@ -0,0 +1,33 @@ +/* +* @@name: scan.2.c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +#define N 100 + +int main(void) +{ + int a[N], b[N]; + int x = 0; + + // initialization + for (int k = 0; k < N; k++) + a[k] = k + 1; + + // a[k] is not included in the computation of producing results in b[k] + #pragma omp parallel for simd reduction(inscan,+: x) + for (int k = 0; k < N; k++) { + b[k] = x; + #pragma omp scan exclusive(x) + x += a[k]; + } + + printf("x = %d, b[0:3] = %d %d %d\n", x, b[0], b[1], b[2]); + // 5050, 0 1 3 + + return 0; +} diff --git a/sources/Example_scan.2.f90 b/sources/Example_scan.2.f90 new file mode 100644 index 0000000..b4fdda7 --- /dev/null +++ b/sources/Example_scan.2.f90 @@ -0,0 +1,30 @@ +! @@name: scan.2.f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_5.0 +program exclusive_scan + implicit none + integer, parameter :: n = 100 + integer a(n), b(n) + integer x, k + + ! initialization + x = 0 + do k = 1, n + a(k) = k + end do + + ! a(k) is not included in the computation of producing results in b(k) + !$omp parallel do simd reduction(inscan,+: x) + do k = 1, n + b(k) = x + !$omp scan exclusive(x) + x = x + a(k) + end do + + print *,'x =', x, ', b(1:3) =', b(1:3) + ! 5050, 0 1 3 + +end program diff --git a/sources/Example_standalone.1.c b/sources/Example_standalone.1.c index 1562fe7..24d875d 100644 --- a/sources/Example_standalone.1.c +++ b/sources/Example_standalone.1.c @@ -4,6 +4,7 @@ * @@compilable: no * @@linkable: no * @@expect: failure +* @@version: omp_3.1 */ void standalone_wrong() diff --git a/sources/Example_standalone.1.f90 b/sources/Example_standalone.1.f90 index ed2d55b..f994c29 100644 --- a/sources/Example_standalone.1.f90 +++ b/sources/Example_standalone.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: no ! @@linkable: no ! @@expect: failure +! @@version: omp_3.1 SUBROUTINE STANDALONE_WRONG() diff --git a/sources/Example_standalone.2.c b/sources/Example_standalone.2.c index cc14535..19f1420 100644 --- a/sources/Example_standalone.2.c +++ b/sources/Example_standalone.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.1 */ void standalone_ok() { diff --git a/sources/Example_standalone.2.f90 b/sources/Example_standalone.2.f90 index 5e2347a..3eec837 100644 --- a/sources/Example_standalone.2.f90 +++ b/sources/Example_standalone.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.1 SUBROUTINE STANDALONE_OK() INTEGER A A = 1 diff --git a/sources/Example_target.1.c b/sources/Example_target.1.c index d9d0820..4c5d094 100644 --- a/sources/Example_target.1.c +++ b/sources/Example_target.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float*, float*, int); extern void output(float*, int); diff --git a/sources/Example_target.1.f90 b/sources/Example_target.1.f90 index a8f9f94..e38026a 100644 --- a/sources/Example_target.1.f90 +++ b/sources/Example_target.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(N) integer :: i,N real :: p(N), v1(N), v2(N) diff --git a/sources/Example_target.2.c b/sources/Example_target.2.c index d42e78a..83d07e6 100644 --- a/sources/Example_target.2.c +++ b/sources/Example_target.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float*, float*, int); extern void output(float*, int); diff --git a/sources/Example_target.2.f90 b/sources/Example_target.2.f90 index eddf65b..936b62b 100644 --- a/sources/Example_target.2.f90 +++ b/sources/Example_target.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(N) integer :: i,N real :: p(N), v1(N), v2(N) diff --git a/sources/Example_target.3.c b/sources/Example_target.3.c index 83cdb16..ef05790 100644 --- a/sources/Example_target.3.c +++ b/sources/Example_target.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float*, float*, int); extern void output(float*, int); diff --git a/sources/Example_target.3.f90 b/sources/Example_target.3.f90 index 372878c..9bf85de 100644 --- a/sources/Example_target.3.f90 +++ b/sources/Example_target.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(N) integer :: i,N real :: p(N), v1(N), v2(N) diff --git a/sources/Example_target.4.c b/sources/Example_target.4.c index 0d9a63c..c481fd5 100644 --- a/sources/Example_target.4.c +++ b/sources/Example_target.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float*, float*, int); extern void output(float*, int); diff --git a/sources/Example_target.4.f90 b/sources/Example_target.4.f90 index bc85adb..c6c2dfc 100644 --- a/sources/Example_target.4.f90 +++ b/sources/Example_target.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module mults contains subroutine vec_mult(p,v1,v2,N) diff --git a/sources/Example_target.4b.f90 b/sources/Example_target.4b.f90 index 1d8ae3d..7b6ac71 100644 --- a/sources/Example_target.4b.f90 +++ b/sources/Example_target.4b.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module mults contains subroutine vec_mult(p,v1,v2,N) diff --git a/sources/Example_target.5.c b/sources/Example_target.5.c index c29b70e..eb93084 100644 --- a/sources/Example_target.5.c +++ b/sources/Example_target.5.c @@ -4,19 +4,25 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #define THRESHOLD1 1000000 #define THRESHOLD2 1000 + extern void init(float*, float*, int); extern void output(float*, int); + void vec_mult(float *p, float *v1, float *v2, int N) { int i; + init(v1, v2, N); + #pragma omp target if(N>THRESHOLD1) map(to: v1[0:N], v2[:N])\ map(from: p[0:N]) #pragma omp parallel for if(N>THRESHOLD2) for (i=0; iTHRESHHOLD1) map(to: v1, v2 ) map(from: p) !$omp parallel do if(N>THRESHOLD2) do i=1,N p(i) = v1(i) * v2(i) end do !$omp end target + call output(p, N) end subroutine diff --git a/sources/Example_target.6.c b/sources/Example_target.6.c index 4ac2afc..62babdc 100644 --- a/sources/Example_target.6.c +++ b/sources/Example_target.6.c @@ -4,19 +4,25 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ #define THRESHOLD1 1000000 #define THRESHOLD2 1000 + extern void init(float*, float*, int); extern void output(float*, int); + void vec_mult(float *p, float *v1, float *v2, int N) { int i; + init(v1, v2, N); + #pragma omp target parallel for \ if(target: N>THRESHOLD1) if(parallel: N>THRESHOLD2) \ map(to: v1[0:N], v2[:N]) map(from: p[0:N]) for (i=0; iTHRESHHOLD1) if(parallel: N>THRESHOLD2) & !$omp& map(to: v1, v2 ) map(from: p) @@ -18,5 +22,6 @@ subroutine vec_mult(p, v1, v2, N) p(i) = v1(i) * v2(i) end do !$omp end target parallel do + call output(p, N) end subroutine diff --git a/sources/Example_target_data.1.c b/sources/Example_target_data.1.c index 9bfea76..c13f93d 100644 --- a/sources/Example_target_data.1.c +++ b/sources/Example_target_data.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float*, float*, int); extern void output(float*, int); diff --git a/sources/Example_target_data.1.f90 b/sources/Example_target_data.1.f90 index 9c79fd9..2c4f32d 100644 --- a/sources/Example_target_data.1.f90 +++ b/sources/Example_target_data.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(p, v1, v2, N) real :: p(N), v1(N), v2(N) integer :: i diff --git a/sources/Example_target_data.2.c b/sources/Example_target_data.2.c index 9155a9a..b545449 100644 --- a/sources/Example_target_data.2.c +++ b/sources/Example_target_data.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float*, float*, int); extern void init_again(float*, float*, int); diff --git a/sources/Example_target_data.2.f90 b/sources/Example_target_data.2.f90 index 1a450d3..9b1fabd 100644 --- a/sources/Example_target_data.2.f90 +++ b/sources/Example_target_data.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(p, v1, v2, N) real :: p(N), v1(N), v2(N) integer :: i diff --git a/sources/Example_target_data.3.c b/sources/Example_target_data.3.c index 05cb61d..e2d62d9 100644 --- a/sources/Example_target_data.3.c +++ b/sources/Example_target_data.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include diff --git a/sources/Example_target_data.3.f90 b/sources/Example_target_data.3.f90 index 026f77e..1032177 100644 --- a/sources/Example_target_data.3.f90 +++ b/sources/Example_target_data.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine gramSchmidt(Q,rows,cols) integer :: rows,cols, i,k double precision :: Q(rows,cols), tmp diff --git a/sources/Example_target_data.4.c b/sources/Example_target_data.4.c index 8f66094..89b329f 100644 --- a/sources/Example_target_data.4.c +++ b/sources/Example_target_data.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ diff --git a/sources/Example_target_data.4.f90 b/sources/Example_target_data.4.f90 index 4401202..e7cd232 100644 --- a/sources/Example_target_data.4.f90 +++ b/sources/Example_target_data.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module mults contains diff --git a/sources/Example_target_data.5.cpp b/sources/Example_target_data.5.cpp index fdfd990..f603afd 100644 --- a/sources/Example_target_data.5.cpp +++ b/sources/Example_target_data.5.cpp @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ void vec_mult(float* &, float* &, float* &, int &); extern void init(float*, float*, int); diff --git a/sources/Example_target_data.5.f90 b/sources/Example_target_data.5.f90 index f9e8eaa..79d0c45 100644 --- a/sources/Example_target_data.5.f90 +++ b/sources/Example_target_data.5.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module my_mult contains subroutine foo(p0,v1,v2,N) diff --git a/sources/Example_target_data.6.c b/sources/Example_target_data.6.c index c0a8b07..d912a4b 100644 --- a/sources/Example_target_data.6.c +++ b/sources/Example_target_data.6.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #define THRESHOLD 1000000 extern void init(float*, float*, int); diff --git a/sources/Example_target_data.6.f90 b/sources/Example_target_data.6.f90 index 52ca758..8b197c9 100644 --- a/sources/Example_target_data.6.f90 +++ b/sources/Example_target_data.6.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module params integer,parameter :: THRESHOLD=1000000 end module diff --git a/sources/Example_target_data.7.c b/sources/Example_target_data.7.c index 138956c..a07832e 100644 --- a/sources/Example_target_data.7.c +++ b/sources/Example_target_data.7.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #define THRESHOLD 1000000 extern void init(float*, float*, int); diff --git a/sources/Example_target_data.7.f90 b/sources/Example_target_data.7.f90 index 8c443b9..da54d4e 100644 --- a/sources/Example_target_data.7.f90 +++ b/sources/Example_target_data.7.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module params integer, parameter :: THRESHOLD=1000000 end module diff --git a/sources/Example_target_defaultmap.1.c b/sources/Example_target_defaultmap.1.c new file mode 100644 index 0000000..f0b5acb --- /dev/null +++ b/sources/Example_target_defaultmap.1.c @@ -0,0 +1,93 @@ +/* +* @@name: target_defaultmap.1.c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +#include +#define N 2 + +int main(){ + typedef struct S_struct { int s; int A[N]; } S_struct_t; + + + int s; //scalar int variable (scalar) + int A[N]; //aggregate variable (array) + S_struct_t S; //aggregate variable (structure) + int *ptr; //scalar, pointer variable (pointer) + + int s1, s2, s3; + +// Initialize everything to zero; + s=2; s1=s2=s3=0; + A[0]=0; A[1]=0; + S.s=0; S.A[0]=0; S.A[1]=0; + +// Target Region 1 + // Uses defaultmap to set scalars, aggregates & pointers + // to normal defaults. + #pragma omp target \ + defaultmap(firstprivate: scalar) //could also be default \ + defaultmap(tofrom: aggregate) //could also be default \ + defaultmap(default: pointer) //must be default \ + map(ptr2m[:N]) + { + s = 3; // SCALAR firstprivate, value not returned + + A[0] = 3; A[1] = 3; // AGGREGATE array, default map tofrom + + // AGGREGATE structure, default tofrom + S.s = 2; + S.A[0] = 2; S.A[1] = 2; + + ptr = &A[0]; // POINTER is private + ptr[0] = 2; ptr[1] = 2; + + } + if(s==2 && A[0]==2 && S.s==2 && S.A[0]==2) + printf(" PASSED 1 of 4\n"); + + +// Target Region 2 + // no implicit mapping allowed. + #pragma omp target defaultmap(none) map(tofrom: s, A, S) + { + s +=5; // All variables must be explicitly mapped + A[0] +=5; A[1]+=5; + S.s +=5; + S.A[0]+=5; S.A[1]+=5; + } + if(s==7 && A[0]==7 && S.s==7 && S.A[0]==7) printf(" PASSED 2 of 4\n"); + + +// Target Region 3 + // defaultmap & explicit map with variables in same category + s1=s2=s3=1; + #pragma omp defaultmap(tofrom: scalar) map(firstprivate: s1,s2) + { + s1 += 5; // firstprivate (s1 value not returned to host) + s2 += 5; // firstprivate (s2 value not returned to host) + s3 += s1 + s2; // mapped as tofrom + } + if(s1==1 && s2==1 && s3==13 ) printf(" PASSED 3 of 4\n"); + + +// Target Region 4 + A[0]=0; A[1]=0; + S.A[0]=0; S.A[1]=0; + + // arrays and structure are firstprivate, and scalars are from + #pragma omp target defaultmap(firstprivate: aggregate) map(from: s1, s2) + { + + A[0]+=1; S.A[0]+=1; //Aggregate changes not returned to host + A[1]+=1; S.A[1]+=1; //Aggregate changes not returned to host + s1 = A[0]+S.A[0]; //s1 value returned to host + s2 = A[1]+S.A[1]; //s1 value returned to host + } + if( A[0]==0 && S.A[0]==0 && s1==2 ) printf(" PASSED 4 of 4\n"); + +} diff --git a/sources/Example_target_defaultmap.1.f90 b/sources/Example_target_defaultmap.1.f90 new file mode 100644 index 0000000..4b6d8da --- /dev/null +++ b/sources/Example_target_defaultmap.1.f90 @@ -0,0 +1,105 @@ +! @@name: defaultmap.1f90 +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_5.0 +program defaultmap + integer, parameter :: N=2 + + type DDT_sA + integer :: s + integer :: A(N) + end type + + integer :: s,s1,s2,s3 !! SCALAR: variable (integer) + + integer,target :: A(N) !! AGGREGATE: Array + type(DDT_sA) :: D !! AGGREGATE: Derived Data Type (D) + + integer,allocatable :: H(:) !! ALLOCATABLE: Heap allocated array + + integer,pointer :: ptrA(:) !! POINTER: points to Array + + ! Assign vaues to scalar, Array, Allocatable, and Pointers + + s=2; + s1=0; s2=0; s3=0 + D%s=0; D%A(1)=0; D%A(2)=0 + A(1)=0; A(2)=0 + + allocate( H(2) ) + H(1)=0; H(2)=0 + +!! Target Region 1 + !! Using defaultmap to set scalars, aggregates & pointers + !! and allocatables to normal defaults. + !$omp target & + !$omp& defaultmap( firstprivate: scalar) & + !$omp& defaultmap( tofrom: aggregate) & + !$omp& defaultmap( tofrom: allocatable) & + !$omp& defaultmap( default: pointer) + + s = 3 !! SCALAR firstprivate, value not returned + + A(1) = 3 !! AGGREGATE array, default map tofrom + A(2) = 3 + + D%s = 2 !! AGGR. Derived Types, default map tofrom + D%A(1) = 2; D%A(2) = 2 + + H(1) = 2; H(2) = 2 !! ALLOCATABLE, default map tofrom + + ptrA=>A !! POINTER is private + ptrA(1) = 2; ptrA(2) = 2 + + !$omp end target + + if(s==2 .and. A(1)==2 .and. D%s==2 .and. D%A(1)==2 .and. H(1) == 2) & + print*," PASSED 1 of 4" + +!! Target Region 2 + !! no implicit mapping allowed + !$omp target defaultmap(none) map(tofrom: s, A, D) + + s=s+5 !! All variables must be explicitly mapped + A(1)=A(1)+5; A(2)=A(2)+5 + D%s=D%s+5 + D%A(1)=D%A(1)+5; D%A(2)=D%A(2)+5 + + !$omp end target + if(s==7 .and. A(1)==7 .and. D%s==7 .and. D%A(1)==7) print*," PASSED 2 of 4" + +!! Target Region 3 + !!defaultmap & explicit map with variables in same category + s1=1; s2=1; s3=1 + !$omp defaultmap(tofrom: scalar) map(firstprivate: s1,s2) + + s1 = s1+5; !! firstprivate (s1 value not returned to host) + s2 = s2+5; !! firstprivate (s2 value not returned to host) + s3 = s3 +s1 + s2; !! mapped as tofrom + + !$omp end target + if(s1==1 .and. s2==1 .and. s3==13) print*," PASSED 3 of 4" + +!! Target Region 4 + A(1)=0; A(2)=0 + D%A(1)=0; D%A(2)=0 + H(1)=0; H(2)=0 + !! non-allocated arrays & derived types are in AGGREGATE cat. + !! Allocatable Arrays are in ALLOCATABLE category + !! Scalars are explicitly mapped from + !$omp target defaultmap(firstprivate: aggregate ) & + !$omp& defaultmap(firstprivate: allocatable) & + !$omp& map(from: s1, s2) + + A(1)=A(1)+1; D%A(1)=D%A(1)+1; H(1)=H(1)+1 !!changes not returned to host + A(2)=A(2)+1; D%A(2)=D%A(2)+1; H(2)=H(2)+1 !!changes not returned to host + s1 = A(1)+D%A(1)+H(1) !!s1 returned to host + s2 = A(2)+D%A(2)+H(1) !!s2 returned to host + + !$omp end target + if(A(1)==0 .and. D%A(1)==0 .and. H(1)==0 .and. s1==3) & + print*," PASSED 4 of 4" + +end program diff --git a/sources/Example_target_mapper.1.c b/sources/Example_target_mapper.1.c index 0a710af..c6f6fc2 100644 --- a/sources/Example_target_mapper.1.c +++ b/sources/Example_target_mapper.1.c @@ -1,9 +1,10 @@ /* * @@name: target_mapper_map.1c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_5.0 */ #include #include @@ -19,7 +20,6 @@ typedef struct myvec{ void init(myvec_t *s); int main(){ - myvec_t s; s.data = (double *)calloc(N,sizeof(double)); @@ -33,4 +33,3 @@ int main(){ void init(myvec_t *s) { for(int i=0; ilen; i++) s->data[i]=i; } - diff --git a/sources/Example_target_mapper.1.f90 b/sources/Example_target_mapper.1.f90 index 17af08f..f063481 100644 --- a/sources/Example_target_mapper.1.f90 +++ b/sources/Example_target_mapper.1.f90 @@ -1,8 +1,10 @@ ! @@name: target_mapper.1.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_5.0 + module my_structures type myvec_t integer :: len diff --git a/sources/Example_target_mapper.2.c b/sources/Example_target_mapper.2.c index f1c86d1..b810bf6 100644 --- a/sources/Example_target_mapper.2.c +++ b/sources/Example_target_mapper.2.c @@ -1,9 +1,10 @@ /* * @@name: target_mapper_map.2.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_5.0 */ #include // N MUST BE EVEN diff --git a/sources/Example_target_mapper.2.f90 b/sources/Example_target_mapper.2.f90 index 663d76d..45e2822 100644 --- a/sources/Example_target_mapper.2.f90 +++ b/sources/Example_target_mapper.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_5.0 module complex_mats integer, parameter :: N=100 !N must be even diff --git a/sources/Example_target_mapper.3.c b/sources/Example_target_mapper.3.c index dc680ed..b2f6e6b 100644 --- a/sources/Example_target_mapper.3.c +++ b/sources/Example_target_mapper.3.c @@ -1,9 +1,10 @@ /* * @@name: target_mapper_map.3.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_target_mapper.3.f90 b/sources/Example_target_mapper.3.f90 index 1e3d326..75db578 100644 --- a/sources/Example_target_mapper.3.f90 +++ b/sources/Example_target_mapper.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_5.0 module my_structures type myvec_t diff --git a/sources/Example_target_offload_control.1.c b/sources/Example_target_offload_control.1.c index 201127c..b0b68a9 100644 --- a/sources/Example_target_offload_control.1.c +++ b/sources/Example_target_offload_control.1.c @@ -1,9 +1,10 @@ /* * @@name: target_offload_control.1c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_target_offload_control.1.f90 b/sources/Example_target_offload_control.1.f90 index 6561606..85cb956 100644 --- a/sources/Example_target_offload_control.1.f90 +++ b/sources/Example_target_offload_control.1.f90 @@ -1,8 +1,9 @@ ! @@name: target_offload_control.1f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 module offload_policy diff --git a/sources/Example_target_ptr_map.1.c b/sources/Example_target_ptr_map.1.c index 404cfee..64d3693 100644 --- a/sources/Example_target_ptr_map.1.c +++ b/sources/Example_target_ptr_map.1.c @@ -1,9 +1,10 @@ /* -* @@name: target_pointer_map.1 +* @@name: target_ptr_map.1 * @@type: C * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_target_ptr_map.2.c b/sources/Example_target_ptr_map.2.c index 0bad89e..f8d3195 100644 --- a/sources/Example_target_ptr_map.2.c +++ b/sources/Example_target_ptr_map.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_target_ptr_map.3a.c b/sources/Example_target_ptr_map.3a.c new file mode 100644 index 0000000..3e8c754 --- /dev/null +++ b/sources/Example_target_ptr_map.3a.c @@ -0,0 +1,43 @@ +/* +* @@name: target_ptr_map.3a.c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: failure +* @@version: omp_5.0 +*/ +#define N 100 + +int x[N], y[N]; +#pragma omp declare target +int *p1; +#pragma omp end declare target +int *p2; + +int foo() +{ + p1 = &x[0]; + p2 = &y[0]; + + // Explicitly map array section x[:N] + #pragma omp target enter data map(x[:N]) + + #pragma omp target // as if .. map(p1) map(p1[:0]) map(p2[:0]) map(y) + { + // Accessing the mapped arrays x,y is OK here. + x[0] = 1; + y[1] = 2; + + // Pointer attachment for p1 does not occur here + // because p1[:0] does not allocate a new array section and + // array x is present on the target construct as it was mapped + // before by the target enter data directive. + p1[0] = 3; // accessing p1 is undefined + + // The initial value of p2 in the target region is undefined + // because map(y) may occur after map(p2[:0]). + p2[1] = 4; // accessing p2 is undefined + } + + return 0; +} diff --git a/sources/Example_target_ptr_map.3b.c b/sources/Example_target_ptr_map.3b.c new file mode 100644 index 0000000..743121c --- /dev/null +++ b/sources/Example_target_ptr_map.3b.c @@ -0,0 +1,40 @@ +/* +* @@name: target_ptr_map.3b.c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +* @@version: omp_5.0 +*/ +#define N 100 + +int x[N], y[N]; +#pragma omp declare target +int *p1; +#pragma omp end declare target +int *p2; + +int foo() +{ + p1 = &x[0]; + p2 = &y[0]; + + // Explicitly map array section y[:N] + #pragma omp target enter data map(y[:N]) + + #pragma omp target map(x[:N]) map(p1[:N]) map(p2[:0]) + { + // Accessing the mapped arrays x,y is OK here. + x[0] = 1; + y[1] = 2; + + // Pointer attachment for p1 occurs here when array x is mapped + // on the target construct (as p1 = &x[0] on the device) + p1[0] = 3; // accessing p1 is OK + + // p2 in the target region is initialized to &y[0] + p2[1] = 4; // accessing p2 is OK + } + + return 0; +} diff --git a/sources/Example_target_reduction.1.c b/sources/Example_target_reduction.1.c new file mode 100644 index 0000000..63f9f5c --- /dev/null +++ b/sources/Example_target_reduction.1.c @@ -0,0 +1,34 @@ +/* +* @@name: target_reduction.1.c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +int f(int); +int g(int); +int main() +{ + int sum1=0, sum2=0; + int i; + const int n = 100; + + #pragma omp target teams distribute reduction(+:sum1) + for (int i = 0; i < n; i++) { + sum1 += f(i); + } + + #pragma omp target teams distribute reduction(+:sum2) + for (int i = 0; i < n; i++) { + sum2 += g(i) * sum1; + } + + printf( "sum1 = %d, sum2 = %d\n", sum1, sum2); + //OUTPUT: sum1 = 9900, sum2 = 147015000 + return 0; +} + +int f(int res){ return res*2; } +int g(int res){ return res*3; } diff --git a/sources/Example_target_reduction.1.f90 b/sources/Example_target_reduction.1.f90 new file mode 100644 index 0000000..5818d0d --- /dev/null +++ b/sources/Example_target_reduction.1.f90 @@ -0,0 +1,40 @@ +! @@name: target_reduction.1.f90 +! @@type: F-free +! @@compilable: yes, omp_5.0 +! @@linkable: yes +! @@expect: success +! @@version: omp_5.0 +program target_reduction_ex1 + interface + function f(res) + integer :: f, res + end function + function g(res) + integer :: g, res + end function + end interface + integer :: sum1, sum2, i + integer, parameter :: n = 100 + sum1 = 0 + sum2 = 0 + !$omp target teams distribute reduction(+:sum1) + do i=1,n + sum1 = sum1 + f(i) + end do + !$omp target teams distribute reduction(+:sum2) + do i=1,n + sum2 = sum2 + g(i)*sum1 + end do + print *, "sum1 = ", sum1, ", sum2 = ", sum2 + !!OUTPUT: sum1 = 10100 , sum2 = 153015000 +end program + + +integer function f(res) + integer :: res + f = res*2 +end function +integer function g(res) + integer :: res + g = res*3 +end function diff --git a/sources/Example_target_reduction.2.c b/sources/Example_target_reduction.2.c new file mode 100644 index 0000000..f367bfd --- /dev/null +++ b/sources/Example_target_reduction.2.c @@ -0,0 +1,36 @@ +/* +* @@name: target_reduction.2.c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +int f(int); +int g(int); +int main() +{ + int sum1=0, sum2=0; + int i; + const int n = 100; + + #pragma omp target data map(sum1,sum2) + { + #pragma omp target teams distribute reduction(+:sum1) + for (int i = 0; i < n; i++) { + sum1 += f(i); + } + + #pragma omp target teams distribute map(sum1) reduction(+:sum2) + for (int i = 0; i < n; i++) { + sum2 += g(i) * sum1; + } + } + printf( "sum1 = %d, sum2 = %d\n", sum1, sum2); + //OUTPUT: sum1 = 9900, sum2 = 147015000 + return 0; +} + +int f(int res){ return res*2; } +int g(int res){ return res*3; } diff --git a/sources/Example_target_reduction.2.f90 b/sources/Example_target_reduction.2.f90 new file mode 100644 index 0000000..4557181 --- /dev/null +++ b/sources/Example_target_reduction.2.f90 @@ -0,0 +1,43 @@ +! @@name: target_reduction.2.f90 +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_5.0 + +program target_reduction_ex2 + interface + function f(res) + integer :: f, res + end function + function g(res) + integer :: g, res + end function + end interface + integer :: sum1, sum2, i + integer, parameter :: n = 100 + sum1 = 0 + sum2 = 0 + !$omp target data map(sum1, sum2) + !$omp target teams distribute reduction(+:sum1) + do i=1,n + sum1 = sum1 + f(i) + end do + !$omp target teams distribute map(sum1) reduction(+:sum2) + do i=1,n + sum2 = sum2 + g(i)*sum1 + end do + !$omp end target data + print *, "sum1 = ", sum1, ", sum2 = ", sum2 + !!OUTPUT: sum1 = 10100 , sum2 = 153015000 +end program + + +integer function f(res) + integer :: res + f = res*2 +end function +integer function g(res) + integer :: res + g = res*3 +end function diff --git a/sources/Example_target_reverse_offload.7.c b/sources/Example_target_reverse_offload.7.c index c26b0c1..42d5525 100644 --- a/sources/Example_target_reverse_offload.7.c +++ b/sources/Example_target_reverse_offload.7.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_target_reverse_offload.7.f90 b/sources/Example_target_reverse_offload.7.f90 index c99122f..6fce764 100644 --- a/sources/Example_target_reverse_offload.7.f90 +++ b/sources/Example_target_reverse_offload.7.f90 @@ -3,11 +3,12 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 !$omp requires reverse_offload subroutine error_handler(wrong_value, index) - integer :: error_value,index + integer :: wrong_value,index !$omp declare target device_type(host) write( *,'("Error in offload: A(",i3,")=",i3)' ) index,wrong_value @@ -27,9 +28,9 @@ program rev_off !$omp target map(A) do i=1,N if (A(i) /= i) then - !$omp omp target device(ancestor: 1) map(always,to :A(i)) + !$omp target device(ancestor: 1) map(always,to :A(i)) call error_handler(A(i), i) - !$omp omp end target + !$omp end target endif end do !$omp end target diff --git a/sources/Example_target_struct_map.1.c b/sources/Example_target_struct_map.1.c index f79e5d8..b358afb 100644 --- a/sources/Example_target_struct_map.1.c +++ b/sources/Example_target_struct_map.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_target_struct_map.2.c b/sources/Example_target_struct_map.2.c index 348acb6..b99464f 100644 --- a/sources/Example_target_struct_map.2.c +++ b/sources/Example_target_struct_map.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_target_struct_map.2.cpp b/sources/Example_target_struct_map.2.cpp index e35ec9b..303dc68 100644 --- a/sources/Example_target_struct_map.2.cpp +++ b/sources/Example_target_struct_map.2.cpp @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include #include diff --git a/sources/Example_target_task_reduction.1.c b/sources/Example_target_task_reduction.1.c new file mode 100644 index 0000000..9011629 --- /dev/null +++ b/sources/Example_target_task_reduction.1.c @@ -0,0 +1,32 @@ +/* +* @@name: target_task_reduction.1.c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +#pragma omp declare target to(device_compute) +void device_compute(int *); +void host_compute(int *); +int main() +{ + int sum = 0; + + #pragma omp parallel master + #pragma omp taskgroup task_reduction(+:sum) + { + #pragma omp target in_reduction(+:sum) nowait + device_compute(&sum); + + #pragma omp task in_reduction(+:sum) + host_compute(&sum); + } + printf( "sum = %d\n", sum); + //OUTPUT: sum = 2 + return 0; +} + +void device_compute(int *sum){ *sum = 1; } +void host_compute(int *sum){ *sum = 1; } diff --git a/sources/Example_target_task_reduction.1.f90 b/sources/Example_target_task_reduction.1.f90 new file mode 100644 index 0000000..b66851f --- /dev/null +++ b/sources/Example_target_task_reduction.1.f90 @@ -0,0 +1,40 @@ +! @@name: target_task_reduction.1.f90 +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +! @@version: omp_5.0 +program target_task_reduction_ex1 + interface + subroutine device_compute(res) + !$omp declare target to(device_compute) + integer :: res + end subroutine device_compute + subroutine host_compute(res) + integer :: res + end subroutine host_compute + end interface + integer :: sum + sum = 0 + !$omp parallel master + !$omp taskgroup task_reduction(+:sum) + !$omp target in_reduction(+:sum) nowait + call device_compute(sum) + !$omp end target + !$omp task in_reduction(+:sum) + call host_compute(sum) + !$omp end task + !$omp end taskgroup + !$omp end parallel master + print *, "sum = ", sum + !!OUTPUT: sum = 2 +end program + +subroutine device_compute(sum) + integer :: sum + sum = 1 +end subroutine +subroutine host_compute(sum) + integer :: sum + sum = 1 +end subroutine diff --git a/sources/Example_target_task_reduction.2a.c b/sources/Example_target_task_reduction.2a.c new file mode 100644 index 0000000..9802459 --- /dev/null +++ b/sources/Example_target_task_reduction.2a.c @@ -0,0 +1,35 @@ +/* +* @@name: target_task_reduction.2.c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +#pragma omp declare target to(device_compute) +extern void device_compute(int *); +extern void host_compute(int *); +int main() +{ + int sum = 0; + + #pragma omp parallel sections reduction(task, +:sum) + { + #pragma omp section + { + #pragma omp target in_reduction(+:sum) + device_compute(&sum); + } + #pragma omp section + { + host_compute(&sum); + } + } + printf( "sum = %d\n", sum); + //OUTPUT: sum = 2 + return 0; +} + +void device_compute(int *sum){ *sum = 1; } +void host_compute(int *sum){ *sum = 1; } diff --git a/sources/Example_target_task_reduction.2a.f90 b/sources/Example_target_task_reduction.2a.f90 new file mode 100644 index 0000000..4487a7c --- /dev/null +++ b/sources/Example_target_task_reduction.2a.f90 @@ -0,0 +1,38 @@ +! @@name: target_task_reduction.2.f90 +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_5.0 +program target_task_reduction_ex2 + interface + subroutine device_compute(res) + !$omp declare target to(device_compute) + integer :: res + end subroutine device_compute + subroutine host_compute(res) + integer :: res + end subroutine host_compute + end interface + integer :: sum + sum = 0 + !$omp parallel sections reduction(task,+:sum) + !$omp section + !$omp target in_reduction(+:sum) nowait + call device_compute(sum) + !$omp end target + !$omp section + call host_compute(sum) + !$omp end parallel sections + print *, "sum = ", sum + !!OUTPUT: sum = 2 +end program + +subroutine device_compute(sum) + integer :: sum + sum = 1 +end subroutine +subroutine host_compute(sum) + integer :: sum + sum = 1 +end subroutine diff --git a/sources/Example_target_task_reduction.2b.c b/sources/Example_target_task_reduction.2b.c new file mode 100644 index 0000000..07054c7 --- /dev/null +++ b/sources/Example_target_task_reduction.2b.c @@ -0,0 +1,30 @@ +/* +* @@name: target_task_reduction.2b.c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +#pragma omp declare target to(device_compute) +extern void device_compute(int *); +extern void host_compute(int *); +int main() +{ + int sum = 0; + + #pragma omp parallel master reduction(task, +:sum) + { + #pragma omp target in_reduction(+:sum) nowait + device_compute(&sum); + + host_compute(&sum); + } + printf( "sum = %d\n", sum); + //OUTPUT: sum = 2 + return 0; +} + +void device_compute(int *sum){ *sum = 1; } +void host_compute(int *sum){ *sum = 1; } diff --git a/sources/Example_target_task_reduction.2b.f90 b/sources/Example_target_task_reduction.2b.f90 new file mode 100644 index 0000000..af0b6d5 --- /dev/null +++ b/sources/Example_target_task_reduction.2b.f90 @@ -0,0 +1,38 @@ +! @@name: target_task_reduction.2b.f90 +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_5.0 +program target_task_reduction_ex2b + interface + subroutine device_compute(res) + !$omp declare target to(device_compute) + integer :: res + end subroutine device_compute + subroutine host_compute(res) + integer :: res + end subroutine host_compute + end interface + integer :: sum + sum = 0 + !$omp parallel master reduction(task,+:sum) + !$omp target in_reduction(+:sum) nowait + call device_compute(sum) + !$omp end target + call host_compute(sum) + !$omp end parallel sections + print *, "sum = ", sum + !!OUTPUT: sum = 2 +end program + + +subroutine device_compute(sum) + integer :: sum + sum = 1 +end subroutine +subroutine host_compute(sum) + integer :: sum + sum = 1 +end subroutine + diff --git a/sources/Example_target_unstructured_data.1.c b/sources/Example_target_unstructured_data.1.c index 190a7bd..cee1b33 100644 --- a/sources/Example_target_unstructured_data.1.c +++ b/sources/Example_target_unstructured_data.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success + * @@version: omp_4.5 */ #include typedef struct { diff --git a/sources/Example_target_unstructured_data.1.cpp b/sources/Example_target_unstructured_data.1.cpp index c894b17..3803aff 100644 --- a/sources/Example_target_unstructured_data.1.cpp +++ b/sources/Example_target_unstructured_data.1.cpp @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ class Matrix { diff --git a/sources/Example_target_unstructured_data.1.f90 b/sources/Example_target_unstructured_data.1.f90 index 24eca51..fff5ed2 100644 --- a/sources/Example_target_unstructured_data.1.f90 +++ b/sources/Example_target_unstructured_data.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 module example real(8), allocatable :: A(:) diff --git a/sources/Example_target_update.1.c b/sources/Example_target_update.1.c index f506b39..402e0e8 100644 --- a/sources/Example_target_update.1.c +++ b/sources/Example_target_update.1.c @@ -4,6 +4,8 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@expect: success +* @@version: omp_4.0 */ extern void init(float *, float *, int); extern void init_again(float *, float *, int); diff --git a/sources/Example_target_update.1.f90 b/sources/Example_target_update.1.f90 index 47e1e7e..11b9a3c 100644 --- a/sources/Example_target_update.1.f90 +++ b/sources/Example_target_update.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(p, v1, v2, N) real :: p(N), v1(N), v2(N) integer :: i diff --git a/sources/Example_target_update.2.c b/sources/Example_target_update.2.c index f106dee..70c44f6 100644 --- a/sources/Example_target_update.2.c +++ b/sources/Example_target_update.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float *, float *, int); extern int maybe_init_again(float *, int); diff --git a/sources/Example_target_update.2.f90 b/sources/Example_target_update.2.f90 index 07c55a3..42dd042 100644 --- a/sources/Example_target_update.2.f90 +++ b/sources/Example_target_update.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(p, v1, v2, N) interface logical function maybe_init_again (v1, N) diff --git a/sources/Example_task_dep.1.c b/sources/Example_task_dep.1.c index 426d141..66afe29 100644 --- a/sources/Example_task_dep.1.c +++ b/sources/Example_task_dep.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include int main() { diff --git a/sources/Example_task_dep.1.f90 b/sources/Example_task_dep.1.f90 index 356d553..9f745be 100644 --- a/sources/Example_task_dep.1.f90 +++ b/sources/Example_task_dep.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: x x = 1 diff --git a/sources/Example_task_dep.10.c b/sources/Example_task_dep.10.c index 32b9ce0..7f1d2f3 100644 --- a/sources/Example_task_dep.10.c +++ b/sources/Example_task_dep.10.c @@ -4,7 +4,10 @@ * @@compilable: no * @@linkable: no * @@expect: failure +* @@version: omp_5.0 */ +extern int longTaskA(), shortTaskB(); +extern int shortTaskAC(int,int), longTaskBC(int,int); void foo (void) { int a, b, c; diff --git a/sources/Example_task_dep.10.f90 b/sources/Example_task_dep.10.f90 index bf9bec6..c18f024 100644 --- a/sources/Example_task_dep.10.f90 +++ b/sources/Example_task_dep.10.f90 @@ -3,6 +3,7 @@ ! @@compilable: no ! @@linkable: no ! @@expect: failure +! @@version: omp_5.0 subroutine foo integer :: a,b,c c = 0 diff --git a/sources/Example_task_dep.11.c b/sources/Example_task_dep.11.c index 06f3c71..4e58d4b 100644 --- a/sources/Example_task_dep.11.c +++ b/sources/Example_task_dep.11.c @@ -1,11 +1,11 @@ /* * @@name: task_dep.11c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_5.0 */ - #include void set_an_element(int *p, int val) { diff --git a/sources/Example_task_dep.11.f90 b/sources/Example_task_dep.11.f90 index 6f733d9..499a480 100644 --- a/sources/Example_task_dep.11.f90 +++ b/sources/Example_task_dep.11.f90 @@ -1,9 +1,9 @@ ! @@name: task_dep.11f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: no ! @@expect: success - +! @@version: omp_5.0 subroutine set_an_element(e, val) implicit none integer :: e, val @@ -29,7 +29,7 @@ subroutine parallel_computation(n) !$omp single do i=1, n !$omp task depend(out: v(i)) - all set_an_element(v(i), i) + call set_an_element(v(i), i) !$omp end task enddo diff --git a/sources/Example_task_dep.12.c b/sources/Example_task_dep.12.c new file mode 100644 index 0000000..683de20 --- /dev/null +++ b/sources/Example_task_dep.12.c @@ -0,0 +1,29 @@ +/* +* @@name: task_dep.12c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +* @@version: omp_4.0 +*/ +#include +int main (int argc, char *argv[]) +{ + int x = 0; + #pragma omp parallel + #pragma omp single + { + /* first explicit task */ + #pragma omp task shared(x) depend(out: x) + x = 1; + + /* second explicit task */ + #pragma omp task shared(x) depend(inout: x) if(0) + x = 2; + + /* statement executed by parent implicit task + prints: x = 2 */ + printf("x = %d\n", x); + } + return 0; +} diff --git a/sources/Example_task_dep.12.f90 b/sources/Example_task_dep.12.f90 new file mode 100644 index 0000000..5fe4f7d --- /dev/null +++ b/sources/Example_task_dep.12.f90 @@ -0,0 +1,27 @@ +! @@name: task_dep.12f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +! @@version: omp_4.0 +program example + integer :: x + x = 0 + !$omp parallel + !$omp single + !... first explicit task + !$omp task shared(x) depend(out: x) + x = 1 + !$omp end task + + !... second explicit task + !$omp task shared(x) depend(inout: x) if(.false.) + x = 2 + !$omp end task + + !... statement executed by parent implicit task + ! prints: x = 2 + print*, "x = ", x + !$omp end single + !$omp end parallel +end program diff --git a/sources/Example_task_dep.2.c b/sources/Example_task_dep.2.c index 7bb082d..595039b 100644 --- a/sources/Example_task_dep.2.c +++ b/sources/Example_task_dep.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include int main() diff --git a/sources/Example_task_dep.2.f90 b/sources/Example_task_dep.2.f90 index 445785d..cb63c90 100644 --- a/sources/Example_task_dep.2.f90 +++ b/sources/Example_task_dep.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: x x = 1 diff --git a/sources/Example_task_dep.3.c b/sources/Example_task_dep.3.c index eb79f00..6c8c5d2 100644 --- a/sources/Example_task_dep.3.c +++ b/sources/Example_task_dep.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include int main() { diff --git a/sources/Example_task_dep.3.f90 b/sources/Example_task_dep.3.f90 index dea2b79..3a2f9f7 100644 --- a/sources/Example_task_dep.3.f90 +++ b/sources/Example_task_dep.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: x !$omp parallel diff --git a/sources/Example_task_dep.4.c b/sources/Example_task_dep.4.c index 32de6e5..6170439 100644 --- a/sources/Example_task_dep.4.c +++ b/sources/Example_task_dep.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include int main() { diff --git a/sources/Example_task_dep.4.f90 b/sources/Example_task_dep.4.f90 index 69512f3..ad0ac58 100644 --- a/sources/Example_task_dep.4.f90 +++ b/sources/Example_task_dep.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: x diff --git a/sources/Example_task_dep.5.c b/sources/Example_task_dep.5.c index 87417ad..5df1dc8 100644 --- a/sources/Example_task_dep.5.c +++ b/sources/Example_task_dep.5.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ // Assume BS divides N perfectly void matmul_depend(int N, int BS, float A[N][N], float B[N][N], float diff --git a/sources/Example_task_dep.5.f90 b/sources/Example_task_dep.5.f90 index c41e9f1..edd31d5 100644 --- a/sources/Example_task_dep.5.f90 +++ b/sources/Example_task_dep.5.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 ! Assume BS divides N perfectly subroutine matmul_depend (N, BS, A, B, C) implicit none diff --git a/sources/Example_task_dep.6.c b/sources/Example_task_dep.6.c index af2874f..ddbc208 100644 --- a/sources/Example_task_dep.6.c +++ b/sources/Example_task_dep.6.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_task_dep.6.f90 b/sources/Example_task_dep.6.f90 index 1bb8c71..51d1a02 100644 --- a/sources/Example_task_dep.6.f90 +++ b/sources/Example_task_dep.6.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 subroutine foo() diff --git a/sources/Example_task_dep.7.c b/sources/Example_task_dep.7.c index 1089785..df6e016 100644 --- a/sources/Example_task_dep.7.c +++ b/sources/Example_task_dep.7.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_task_dep.7.f90 b/sources/Example_task_dep.7.f90 index 3980b46..8d2cd8a 100644 --- a/sources/Example_task_dep.7.f90 +++ b/sources/Example_task_dep.7.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 subroutine foo() diff --git a/sources/Example_task_dep.8.c b/sources/Example_task_dep.8.c index 70b1527..7fbc459 100644 --- a/sources/Example_task_dep.8.c +++ b/sources/Example_task_dep.8.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_task_dep.8.f90 b/sources/Example_task_dep.8.f90 index 2987a05..01aa212 100644 --- a/sources/Example_task_dep.8.f90 +++ b/sources/Example_task_dep.8.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 subroutine foo() diff --git a/sources/Example_task_dep.9.c b/sources/Example_task_dep.9.c index 2ffde0c..35a99e5 100644 --- a/sources/Example_task_dep.9.c +++ b/sources/Example_task_dep.9.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include int main() diff --git a/sources/Example_task_dep.9.f90 b/sources/Example_task_dep.9.f90 index cdf4ce2..f9c312a 100644 --- a/sources/Example_task_dep.9.f90 +++ b/sources/Example_task_dep.9.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 program example integer :: a, b, c, d !$omp parallel diff --git a/sources/Example_task_priority.1.c b/sources/Example_task_priority.1.c index 40c262f..1a90441 100644 --- a/sources/Example_task_priority.1.c +++ b/sources/Example_task_priority.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ void compute_array (float *node, int M); diff --git a/sources/Example_task_priority.1.f90 b/sources/Example_task_priority.1.f90 index 08f2743..3423684 100644 --- a/sources/Example_task_priority.1.f90 +++ b/sources/Example_task_priority.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 subroutine compute_matrix(matrix, M, N) implicit none integer :: M, N diff --git a/sources/Example_task_reduction.1.c b/sources/Example_task_reduction.1.c index e46aa4c..00015c2 100644 --- a/sources/Example_task_reduction.1.c +++ b/sources/Example_task_reduction.1.c @@ -34,8 +34,7 @@ int linked_list_sum(node_t *p) } -int main(int argc, char *argv[]) -{ +int main(int argc, char *argv[]) { int i; // Create the root node. node_t* root = (node_t*) malloc(sizeof(node_t)); @@ -44,8 +43,7 @@ int main(int argc, char *argv[]) node_t* aux = root; // Create N-1 more nodes. - for(i=2;i<=N;++i) - { + for(i=2;i<=N;++i){ aux->next = (node_t*) malloc(sizeof(node_t)); aux = aux->next; aux->val = i; diff --git a/sources/Example_task_reduction.2.c b/sources/Example_task_reduction.2.c new file mode 100644 index 0000000..3afbe2c --- /dev/null +++ b/sources/Example_task_reduction.2.c @@ -0,0 +1,45 @@ +/* +* @@name: task_reduction.2.c +* @@type: C +* @@compilable: yes, omp_5.0 +* @@linkable: yes +* @@expect: success +* @@version: omp_5.0 +*/ +#include +int main(void){ + int N=100, M=10; + int i, x; + +// USE CASE 1 explicit-task reduction + parallel reduction clause + x=0; + #pragma omp parallel num_threads(M) reduction(task,+:x) + { + + x++; // implicit task reduction statement + + #pragma omp single + for(i=0;i void work() { diff --git a/sources/Example_tasking.10.f90 b/sources/Example_tasking.10.f90 index 39dae05..8270a97 100644 --- a/sources/Example_tasking.10.f90 +++ b/sources/Example_tasking.10.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 module example include 'omp_lib.h' integer (kind=omp_lock_kind) lock diff --git a/sources/Example_tasking.11.c b/sources/Example_tasking.11.c index f711073..9c49ff3 100644 --- a/sources/Example_tasking.11.c +++ b/sources/Example_tasking.11.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.1 */ #include void foo ( ) diff --git a/sources/Example_tasking.11.f90 b/sources/Example_tasking.11.f90 index 3db2c63..17d492d 100644 --- a/sources/Example_tasking.11.f90 +++ b/sources/Example_tasking.11.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.1 subroutine foo() integer :: x x = 2 diff --git a/sources/Example_tasking.12.c b/sources/Example_tasking.12.c index 44d9e69..1e4e10e 100644 --- a/sources/Example_tasking.12.c +++ b/sources/Example_tasking.12.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: rt-error +* @@version: omp_3.1 */ #include void foo ( ) diff --git a/sources/Example_tasking.12.f90 b/sources/Example_tasking.12.f90 index 955b116..5c9fa01 100644 --- a/sources/Example_tasking.12.f90 +++ b/sources/Example_tasking.12.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: rt-error +! @@version: omp_3.1 subroutine foo() integer :: x x = 2 diff --git a/sources/Example_tasking.13.c b/sources/Example_tasking.13.c index 27f6f6d..e8dff7e 100644 --- a/sources/Example_tasking.13.c +++ b/sources/Example_tasking.13.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.1 */ #include #include diff --git a/sources/Example_tasking.13.f90 b/sources/Example_tasking.13.f90 index d9426b2..dac54a8 100644 --- a/sources/Example_tasking.13.f90 +++ b/sources/Example_tasking.13.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.1 recursive subroutine bin_search(pos, n, state) use omp_lib integer :: pos, n diff --git a/sources/Example_tasking.14.c b/sources/Example_tasking.14.c index 1006c55..2403b2a 100644 --- a/sources/Example_tasking.14.c +++ b/sources/Example_tasking.14.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.1 */ void bar(void); diff --git a/sources/Example_tasking.14.f90 b/sources/Example_tasking.14.f90 index 8cfee6f..15a61e9 100644 --- a/sources/Example_tasking.14.f90 +++ b/sources/Example_tasking.14.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.1 subroutine foo() integer i !$omp task if(.FALSE.) ! This task is undeferred diff --git a/sources/Example_tasking.15.c b/sources/Example_tasking.15.c index 0191c91..a0359d4 100644 --- a/sources/Example_tasking.15.c +++ b/sources/Example_tasking.15.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include int main() diff --git a/sources/Example_tasking.15.f90 b/sources/Example_tasking.15.f90 index 4fed17c..f429279 100644 --- a/sources/Example_tasking.15.f90 +++ b/sources/Example_tasking.15.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: x x = 1 diff --git a/sources/Example_tasking.16.c b/sources/Example_tasking.16.c index 32b8443..5873fb2 100644 --- a/sources/Example_tasking.16.c +++ b/sources/Example_tasking.16.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include int main() diff --git a/sources/Example_tasking.16.f90 b/sources/Example_tasking.16.f90 index 01f41b0..4903d82 100644 --- a/sources/Example_tasking.16.f90 +++ b/sources/Example_tasking.16.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: x x = 1 diff --git a/sources/Example_tasking.17.c b/sources/Example_tasking.17.c index 1df0ac2..2e2e47b 100644 --- a/sources/Example_tasking.17.c +++ b/sources/Example_tasking.17.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include int main() diff --git a/sources/Example_tasking.17.f90 b/sources/Example_tasking.17.f90 index e82cb57..55763fd 100644 --- a/sources/Example_tasking.17.f90 +++ b/sources/Example_tasking.17.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: x !$omp parallel diff --git a/sources/Example_tasking.18.c b/sources/Example_tasking.18.c index a1eb0a1..ba757e7 100644 --- a/sources/Example_tasking.18.c +++ b/sources/Example_tasking.18.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include int main() diff --git a/sources/Example_tasking.18.f90 b/sources/Example_tasking.18.f90 index 42ee105..796982e 100644 --- a/sources/Example_tasking.18.f90 +++ b/sources/Example_tasking.18.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program example integer :: x x = 1 diff --git a/sources/Example_tasking.19.c b/sources/Example_tasking.19.c index f7cfbe8..8f4d9b1 100644 --- a/sources/Example_tasking.19.c +++ b/sources/Example_tasking.19.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ // Assume BS divides N perfectly void matmul_depend(int N, int BS, float A[N][N], float B[N][N], float diff --git a/sources/Example_tasking.19.f90 b/sources/Example_tasking.19.f90 index 44dc306..1afa1ea 100644 --- a/sources/Example_tasking.19.f90 +++ b/sources/Example_tasking.19.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine matmul_depend (N, BS, A, B, C) integer :: N, BS, BM real, dimension(N, N) :: A, B, C diff --git a/sources/Example_tasking.2.c b/sources/Example_tasking.2.c index e543ada..b5c32ce 100644 --- a/sources/Example_tasking.2.c +++ b/sources/Example_tasking.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ struct node { struct node *left; diff --git a/sources/Example_tasking.2.f90 b/sources/Example_tasking.2.f90 index 5d54f46..e80f946 100644 --- a/sources/Example_tasking.2.f90 +++ b/sources/Example_tasking.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 RECURSIVE SUBROUTINE traverse ( P ) TYPE Node TYPE(Node), POINTER :: left, right diff --git a/sources/Example_tasking.3.c b/sources/Example_tasking.3.c index fe30eab..733cd8c 100644 --- a/sources/Example_tasking.3.c +++ b/sources/Example_tasking.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ typedef struct node node; diff --git a/sources/Example_tasking.3.f90 b/sources/Example_tasking.3.f90 index 98d6615..bab3183 100644 --- a/sources/Example_tasking.3.f90 +++ b/sources/Example_tasking.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 MODULE LIST TYPE NODE diff --git a/sources/Example_tasking.4.c b/sources/Example_tasking.4.c index a7b1fb6..f900bec 100644 --- a/sources/Example_tasking.4.c +++ b/sources/Example_tasking.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ int fib(int n) { int i, j; diff --git a/sources/Example_tasking.4.f b/sources/Example_tasking.4.f index 5d31316..edfd66a 100644 --- a/sources/Example_tasking.4.f +++ b/sources/Example_tasking.4.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 RECURSIVE INTEGER FUNCTION fib(n) RESULT(res) INTEGER n, i, j IF ( n .LT. 2) THEN diff --git a/sources/Example_tasking.5.c b/sources/Example_tasking.5.c index 7d9c27f..72485bd 100644 --- a/sources/Example_tasking.5.c +++ b/sources/Example_tasking.5.c @@ -4,12 +4,14 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ #define LARGE_NUMBER 10000000 double item[LARGE_NUMBER]; extern void process(double); -int main() { +int main() +{ #pragma omp parallel { #pragma omp single diff --git a/sources/Example_tasking.5.f b/sources/Example_tasking.5.f index f3512da..ed7a2a5 100644 --- a/sources/Example_tasking.5.f +++ b/sources/Example_tasking.5.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 real*8 item(10000000) integer i @@ -16,4 +17,5 @@ end do !$omp end single !$omp end parallel + end diff --git a/sources/Example_tasking.6.c b/sources/Example_tasking.6.c index e15fe0d..397b59e 100644 --- a/sources/Example_tasking.6.c +++ b/sources/Example_tasking.6.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ #define LARGE_NUMBER 10000000 double item[LARGE_NUMBER]; diff --git a/sources/Example_tasking.6.f b/sources/Example_tasking.6.f index 403f4c9..e65dac5 100644 --- a/sources/Example_tasking.6.f +++ b/sources/Example_tasking.6.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 real*8 item(10000000) !$omp parallel !$omp single diff --git a/sources/Example_tasking.7.c b/sources/Example_tasking.7.c index f97b325..c1dfbd0 100644 --- a/sources/Example_tasking.7.c +++ b/sources/Example_tasking.7.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ int tp; diff --git a/sources/Example_tasking.7.f b/sources/Example_tasking.7.f index 3b612cb..2a8b3b9 100644 --- a/sources/Example_tasking.7.f +++ b/sources/Example_tasking.7.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 module example integer tp !$omp threadprivate(tp) diff --git a/sources/Example_tasking.8.c b/sources/Example_tasking.8.c index 5cf6a36..a1b76ac 100644 --- a/sources/Example_tasking.8.c +++ b/sources/Example_tasking.8.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.0 */ int tp; diff --git a/sources/Example_tasking.8.f b/sources/Example_tasking.8.f index f43d3c2..02d837d 100644 --- a/sources/Example_tasking.8.f +++ b/sources/Example_tasking.8.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.0 module example integer tp !$omp threadprivate(tp) diff --git a/sources/Example_tasking.9.c b/sources/Example_tasking.9.c index 0c12097..68b7c52 100644 --- a/sources/Example_tasking.9.c +++ b/sources/Example_tasking.9.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: rt-error +* @@version: omp_3.0 */ void work() { diff --git a/sources/Example_tasking.9.f b/sources/Example_tasking.9.f index 9726ee6..857b351 100644 --- a/sources/Example_tasking.9.f +++ b/sources/Example_tasking.9.f @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: rt-error +! @@version: omp_3.0 module example contains subroutine work diff --git a/sources/Example_taskloop.1.c b/sources/Example_taskloop.1.c index ed76212..355b0b6 100644 --- a/sources/Example_taskloop.1.c +++ b/sources/Example_taskloop.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ void long_running_task(void); void loop_body(int i, int j); diff --git a/sources/Example_taskloop.1.f90 b/sources/Example_taskloop.1.f90 index 5f23b20..ff1fb5e 100644 --- a/sources/Example_taskloop.1.f90 +++ b/sources/Example_taskloop.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 subroutine parallel_work integer i integer j diff --git a/sources/Example_taskloop.2.c b/sources/Example_taskloop.2.c index e135ef7..11f3c20 100644 --- a/sources/Example_taskloop.2.c +++ b/sources/Example_taskloop.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ #include diff --git a/sources/Example_taskloop.2.f90 b/sources/Example_taskloop.2.f90 index 7ab507b..15cd08e 100644 --- a/sources/Example_taskloop.2.f90 +++ b/sources/Example_taskloop.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 subroutine parallel_work implicit none integer :: x1, x2 diff --git a/sources/Example_taskloop_reduction.1.c b/sources/Example_taskloop_reduction.1.c index c592b27..77b8a8d 100644 --- a/sources/Example_taskloop_reduction.1.c +++ b/sources/Example_taskloop_reduction.1.c @@ -1,9 +1,10 @@ /* * @@name: taskloop_reduction.1.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_taskloop_reduction.1.f90 b/sources/Example_taskloop_reduction.1.f90 index 5346330..632a08e 100644 --- a/sources/Example_taskloop_reduction.1.f90 +++ b/sources/Example_taskloop_reduction.1.f90 @@ -1,8 +1,10 @@ ! @@name: taskloop_reduction.1.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 + function array_sum(n, v) result(res) implicit none integer :: n, v(n), res diff --git a/sources/Example_taskloop_reduction.2.c b/sources/Example_taskloop_reduction.2.c index 19f8bb8..c901f42 100644 --- a/sources/Example_taskloop_reduction.2.c +++ b/sources/Example_taskloop_reduction.2.c @@ -1,9 +1,10 @@ /* * @@name: taskloop_reduction.2.c * @@type: C -* @@compilable: yes, omp_5.0 +* @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_taskloop_reduction.2.f90 b/sources/Example_taskloop_reduction.2.f90 index b2ce6b2..6fb32d9 100644 --- a/sources/Example_taskloop_reduction.2.f90 +++ b/sources/Example_taskloop_reduction.2.f90 @@ -1,8 +1,10 @@ ! @@name: taskloop_reduction.2.f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_5.0 + function array_sum(n, v) result(res) implicit none integer :: n, v(n), res diff --git a/sources/Example_taskloop_simd_reduction.1.c b/sources/Example_taskloop_simd_reduction.1.c index 1708239..55b0ec8 100644 --- a/sources/Example_taskloop_simd_reduction.1.c +++ b/sources/Example_taskloop_simd_reduction.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_5.0 */ #include diff --git a/sources/Example_taskloop_simd_reduction.1.f90 b/sources/Example_taskloop_simd_reduction.1.f90 index f3138b0..52ab12d 100644 --- a/sources/Example_taskloop_simd_reduction.1.f90 +++ b/sources/Example_taskloop_simd_reduction.1.f90 @@ -1,8 +1,9 @@ ! @@name: taskloop_simd_reduction.1f90 ! @@type: F-free -! @@compilable: yes, omp_5.0 +! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_5.0 program main diff --git a/sources/Example_taskyield.1.c b/sources/Example_taskyield.1.c index b4eff48..88a7fc6 100644 --- a/sources/Example_taskyield.1.c +++ b/sources/Example_taskyield.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_3.1 */ #include diff --git a/sources/Example_taskyield.1.f90 b/sources/Example_taskyield.1.f90 index c5523dc..623a639 100644 --- a/sources/Example_taskyield.1.f90 +++ b/sources/Example_taskyield.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_3.1 subroutine foo ( lock, n ) use omp_lib integer (kind=omp_lock_kind) :: lock diff --git a/sources/Example_teams.1.c b/sources/Example_teams.1.c index bfcee5e..0af405f 100644 --- a/sources/Example_teams.1.c +++ b/sources/Example_teams.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/Example_teams.1.f90 b/sources/Example_teams.1.f90 index 5318263..aae1514 100644 --- a/sources/Example_teams.1.f90 +++ b/sources/Example_teams.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 function dotprod(B,C,N) result(sum) use omp_lib, ONLY : omp_get_num_teams, omp_get_team_num real :: B(N), C(N), sum,sum0, sum1 diff --git a/sources/Example_teams.2.c b/sources/Example_teams.2.c index 6ec1a45..20822bb 100644 --- a/sources/Example_teams.2.c +++ b/sources/Example_teams.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #define min(x, y) (((x) < (y)) ? (x) : (y)) diff --git a/sources/Example_teams.2.f90 b/sources/Example_teams.2.f90 index ec9eeee..8da3a69 100644 --- a/sources/Example_teams.2.f90 +++ b/sources/Example_teams.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 function dotprod(B,C,N, block_size, num_teams, block_threads) result(sum) implicit none real :: B(N), C(N), sum diff --git a/sources/Example_teams.3.c b/sources/Example_teams.3.c index f073020..4b58c9a 100644 --- a/sources/Example_teams.3.c +++ b/sources/Example_teams.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.5 */ float dotprod(float B[], float C[], int N) { diff --git a/sources/Example_teams.3.f90 b/sources/Example_teams.3.f90 index 4f182b6..584a0bf 100644 --- a/sources/Example_teams.3.f90 +++ b/sources/Example_teams.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.5 function dotprod(B,C,N) result(sum) real :: B(N), C(N), sum integer :: N, i diff --git a/sources/Example_teams.4.c b/sources/Example_teams.4.c index 236c66c..c9d9053 100644 --- a/sources/Example_teams.4.c +++ b/sources/Example_teams.4.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #define N 1024*1024 float dotprod(float B[], float C[]) diff --git a/sources/Example_teams.4.f90 b/sources/Example_teams.4.f90 index 6cd0f15..636bbf1 100644 --- a/sources/Example_teams.4.f90 +++ b/sources/Example_teams.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module arrays integer,parameter :: N=1024*1024 real :: B(N), C(N) diff --git a/sources/Example_teams.5.c b/sources/Example_teams.5.c index e82da5c..5310bcd 100644 --- a/sources/Example_teams.5.c +++ b/sources/Example_teams.5.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float *, float *, int); extern void output(float *, int); diff --git a/sources/Example_teams.5.f90 b/sources/Example_teams.5.f90 index 56a6047..16e9d9f 100644 --- a/sources/Example_teams.5.f90 +++ b/sources/Example_teams.5.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(p, v1, v2, N) real :: p(N), v1(N), v2(N) integer :: i diff --git a/sources/Example_teams.6.c b/sources/Example_teams.6.c index 621c21e..6018b61 100644 --- a/sources/Example_teams.6.c +++ b/sources/Example_teams.6.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ extern void init(float *, float *, int); extern void output(float *, int); diff --git a/sources/Example_teams.6.f90 b/sources/Example_teams.6.f90 index e199afd..5fb0b27 100644 --- a/sources/Example_teams.6.f90 +++ b/sources/Example_teams.6.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 subroutine vec_mult(p, v1, v2, N) real :: p(N), v1(N), v2(N) integer :: i diff --git a/sources/Example_udr.1.c b/sources/Example_udr.1.c index 16d0fc8..cff8062 100644 --- a/sources/Example_udr.1.c +++ b/sources/Example_udr.1.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/Example_udr.1.f90 b/sources/Example_udr.1.f90 index 1507f38..1787c13 100644 --- a/sources/Example_udr.1.f90 +++ b/sources/Example_udr.1.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module data_type type :: point diff --git a/sources/Example_udr.2.c b/sources/Example_udr.2.c index 067b161..8dcc33b 100644 --- a/sources/Example_udr.2.c +++ b/sources/Example_udr.2.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/Example_udr.2.f90 b/sources/Example_udr.2.f90 index 461ba8d..e75cb86 100644 --- a/sources/Example_udr.2.f90 +++ b/sources/Example_udr.2.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: no ! @@expect: success +! @@version: omp_4.0 module data_type type :: point diff --git a/sources/Example_udr.3.c b/sources/Example_udr.3.c index 07af689..9801686 100644 --- a/sources/Example_udr.3.c +++ b/sources/Example_udr.3.c @@ -4,6 +4,7 @@ * @@compilable: yes * @@linkable: yes * @@expect: success +* @@version: omp_4.0 */ #include @@ -14,12 +15,9 @@ struct mx_s { int index; }; - /* prototype functions for combiner and initializer in the declare reduction */ - void mx_combine(struct mx_s *out, struct mx_s *in); - void mx_init(struct mx_s *priv, struct mx_s *orig); #pragma omp declare reduction(maxloc: struct mx_s: \ @@ -34,14 +32,12 @@ void mx_combine(struct mx_s *out, struct mx_s *in) } } - void mx_init(struct mx_s *priv, struct mx_s *orig) { priv->value = orig->value; priv->index = orig->index; } - int main(void) { struct mx_s mx; diff --git a/sources/Example_udr.3.f90 b/sources/Example_udr.3.f90 index 581444a..a050071 100644 --- a/sources/Example_udr.3.f90 +++ b/sources/Example_udr.3.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 program max_loc implicit none diff --git a/sources/Example_udr.4.f90 b/sources/Example_udr.4.f90 index 2444ae6..48f216e 100644 --- a/sources/Example_udr.4.f90 +++ b/sources/Example_udr.4.f90 @@ -3,6 +3,7 @@ ! @@compilable: yes ! @@linkable: yes ! @@expect: success +! @@version: omp_4.0 module data_red ! Declare data type. type dt diff --git a/sources/Example_udr.5.cpp b/sources/Example_udr.5.cpp index 9695f22..08f89ba 100644 --- a/sources/Example_udr.5.cpp +++ b/sources/Example_udr.5.cpp @@ -4,6 +4,7 @@ * @@compilable: no * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ class V { float *p; diff --git a/sources/Example_udr.6.cpp b/sources/Example_udr.6.cpp index cba1a03..7becf11 100644 --- a/sources/Example_udr.6.cpp +++ b/sources/Example_udr.6.cpp @@ -4,6 +4,7 @@ * @@compilable: no * @@linkable: no * @@expect: success +* @@version: omp_4.0 */ #include #include diff --git a/sources/test_code_one b/sources/test_code_one new file mode 100644 index 0000000..2fb738b --- /dev/null +++ b/sources/test_code_one @@ -0,0 +1,15 @@ +set opts="" +if ( $aopt == 1 ) then + set opts=" $copt" +else if ( $aopt != 0) then + set sstr=omp.h + if ( "$1" == "f" || "$1" == "f90" ) set sstr="use omp_lib|omp_lib.h" + egrep "$sstr" $f >& /dev/null + if ( $status == 0 ) set opts=" $copt" +endif +echo "### ${f}$opts" | tee -a $logf +$comp -c$opts $f >>& $logf +if ( $status != 0 ) then + echo ">>> $f FAILED" | tee -a $logf + @ cntfail++; +endif diff --git a/sources/test_codes b/sources/test_codes new file mode 100755 index 0000000..e880f71 --- /dev/null +++ b/sources/test_codes @@ -0,0 +1,55 @@ +#!/bin/csh + +set aopt=2 #default(auto), 0:no-copt, 1:with-copt +if ( "$1" == "no-copt" || "$1" == "0" ) then + set aopt=0 +else if ( "$1" == "with-copt"i || "$1" == "1" ) then + set aopt=1 +else if ( "$1" == "auto" || "$1" == "2" ) then + set aopt=2 +else if ( "$1" == "-h" ) then + echo "usage: test_codes [no-copt | with-copt | auto]" + exit +endif + +set copt="-fopenmp" +set cntc=0 +set cntcpp=0 +set cntf=0 +set cntffree=0 +set cntfail=0 +set logf=test_codes.log + +set comp=gcc +foreach f (*.c) + @ cntc++; + source test_code_one c +end + +set comp=g++ +foreach f (*.cpp) + @ cntcpp++; + source test_code_one cpp +end + +set comp=gfortran +foreach f (*.f) + @ cntf++; + source test_code_one f +end + +set comp=gfortran +foreach f (*.f90) + @ cntffree++; + source test_code_one f90 +end + +echo "" | tee -a $logf +echo "Total number of C examples: $cntc" | tee -a $logf +echo "Total number of C++ examples: $cntcpp" | tee -a $logf +echo "Total number of F-fixed examples: $cntf" | tee -a $logf +echo "Total number of F-free examples: $cntffree" | tee -a $logf +echo "Total number of failed examples: $cntfail" | tee -a $logf + +\rm -f *.o *.mod + diff --git a/util/latexdiff/VERSION b/util/latexdiff/VERSION new file mode 100644 index 0000000..7a177ed --- /dev/null +++ b/util/latexdiff/VERSION @@ -0,0 +1,4 @@ +The current version of latexdiff comes from: +git clone -b openmp-rebased git@github.com:jprotze/latexdiff.git + +The commit is 1ed71be6fb71927473bd9468ce42f42e1431b5ab \ No newline at end of file diff --git a/util/latexdiff/latexdiff b/util/latexdiff/latexdiff new file mode 100755 index 0000000..049e870 --- /dev/null +++ b/util/latexdiff/latexdiff @@ -0,0 +1,4951 @@ +#!/usr/bin/env perl +##!/usr/bin/perl -w +# latexdiff - differences two latex files on the word level +# and produces a latex file with the differences marked up. +# +# Copyright (C) 2004-16 F J Tilmann (tilmann@gfz-potsdam.de) +# +# Repository/issue tracker: https://github.com/ftilmann/latexdiff +# CTAN page: http://www.ctan.org/pkg/latexdiff +# +# This program is free software: you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# You should have received a copy of the GNU General Public License +# along with this program. If not, see . +# +# Detailed usage information at the end of the file +# +# +# Version 1.2.2a: +# - improved pattern matching: now allows nested angular brackets, and is no longer confused by escaped curly braces +# - improved pattern matching in COARSE mode: occasionally, the closing bracket or some other elements would be matched in an 'unnatural' way due to another sequence being more minimal in the computational sense, sometimes even causing errors due to tokens moving in or out of the scope of math environments. This is now discouraged by adding internal \DIFANCHOR commands (which are removed again in post-processing) (fixes issues reported via email by li_ruomeng . +# - verbatim and lstlisting environments are marked-up with line-by-line in a similar style to non-verbatim text (requires the listing package to be installed) +# (see new configuration variable VERBATIMLINEENV) +# - --flatten: now supports \verbatiminput and \lstlistinput +# - --flatten: if file is not found, do not fail, simply warn and leave command unexpanded (inspired by issue #112). Don't warn if file name contains #[0-9] as it is then most likely an argument within a command definition rather than an actual file (applies to \input, \subfile, \include commands) +# - added to textcmds: \intertext +# Bug fixes: +# - pattern matching of \verb and \lstinline commands had an error which meant they would trigger on commands beginning with \verb. +# +# Version 1.2.1 (22 June 2017) +# - add "DeclareOldFontCommand" to styles using \bf or \sf old style font commands (fixies issue #92 ) +# - improved markup: process lstinline commands in listings package correctly +# for styles using colour, \verb and \lstinline arguments are marked up with colour (blue for added, red for deleted) +# - bug fix: protecting inline math expressions for mbox did not work as intended (see stack exchange question: http://tex.stackexchange.com/questions/359412/compiling-the-latexdiff-when-adding-a-subscript-before-a-pmatrix-environment-cau) +# - bug fix: when deleted \item commands are followed immediately by unsafe commands, they were not restored properly +# (thanks to J. Protze for pull request) (pull request #89) +# - treat lstlisting and comment as equivalent to verbatim environment +# make environments that are treated like verbatim environments configurable (config variable VERBATIMENV) +# treat lstinlne as equivalent to verb command +# partially addresses issue #38 +# - refactoring: set default configuration variables in a hash, and those that correspond to lists +# - feature: option --add-to-config used to amend configuration variables, which are regex pattern lists +# - bug fix: deleted figures when endfloat package is activated +# - bug fix: alignat environment now always processed correctly (fix issues #65) +# - bug fix: avoid processing of commands as potential files in routine init_regex_arr (fix issue #70 ) +# - minimal feature enhancement: treat '@' as allowed character in commands (strictly speaking requires prior \makeatletter statement, but always assuming it to be +# @ a letter if it is part of a command name will usually lead to the correct behaviour (see http://tex.stackexchange.com/questions/346651/latexdiff-and-let) +# - new feature/bug fix: --flatten option \endinput in included files now respected but only if \endinput stands right at the beginning of the line (issue #77) +# - bug fix: flatten would incorrectly attempt to process commented out \include commands (from discussion in issue #77 ) +# - introduce an invisible space (\hspace{0pt} after \mbox{..} auxiliary commands (not in math mode), to allow line breaks between added and deleted citations (change should not cause adverse behaviour otherwise) +# +# Version 1.2.0: +# - highlight new and deleted figures +# - bug fix in title mark-up. Previously deleted commands in title (such as \title, \author or \date) were marked up erroneously +# - (minor) bug fixes in new 1.1.1 features: disabled label was commented out twice, additional spaces were introduced before list environment begin and end commands +# - depracation fix: left brace in RegEx now needs to be escaped +# - add type PDFCOMMENT based on issue #49 submitted by github user peci1 (Martin Pecka) +# - make utf8 the default encoding +# +# Version 1.1.1 +# - patch mhchem: allow ce in equations +# - flatten now also expands \input etc. in the preamble (but not \usepackage!) +# - Better support for Japanese ( contributed by github user kshramt ) +# - prevent duplicated verbatim hashes (patch contributed by github user therussianjig, issue #36) +# - disable deleted label commands (fixes issue #31) +# - introduce post-processing to reinstate most deleted environments and all needed item commands (fixes issue #1) +# +# Version 1.1.0 +# - treat diacritics (\",\', etc) as safe commands +# - treat \_ and \& correctly as safe commands, even if used without spacing to the next word +# - Add a BOLD markup type that sets added text in bold face (Contribution by Victor Zabalza via pull request ) +# - add append-mboxsafecmd list option to be able to specify special safe commands which need to be surrounded by mbox to avoid breaking (mostly this is needed with ulem package) +# - support for siunitx and cleveref packages: protect \SI command in siunitx package and \cref,\Cref{range}{*} in cleveref packages (thanks to Stefan Pinnow for testing) +# - experimental support for chemformula, mhchem packages: define \ch and \ce in packages as safe (but not \ch,\cee in equation array environments) - these unfortunately will not be marked up (thanks to Stefan Pinnow for testing) +# - bug fix: packages identified correctly even if \usepackage command options extend over several lines (previously \usepackage command needed to be fully contained in one line) +# - new subtype ONLYCHANGEDPAGE outputs only changed pages (might not work well for floating material) +# - new subtype ZLABEL operates similarly to LABEL but uses absolute page numbers (needs zref package) +# - undocumented option --debug/--nodebug to override default setting for debug mode (Default: 0 for release version, 1: for development version +# +# Version 1.0.4 +# - introduce list UNSAFEMATHCMD, which holds list of commands which cannot be marked up with \DIFadd or \DIFdel commands (only relevant for WHOLE and COARSE math markup modes) +# - new subtype LABEL which gives each change a label. This can later be used to only display pages where changes +# have been made (instructions for that are put as comments into the diff'ed file) inspired by answer on http://tex.stackexchange.com/questions/166049/invisible-markers-in-pdfs-using-pdflatex +# - Configuration variables take into accout some commands from additional packages: +# tikzpicture environment now treated as PICTUREENV, and \smallmatrix in ARRENV (amsmath) +# - --flatten: support for \subfile command (subfiles package) (in response to http://tex.stackexchange.com/questions/167620/latexdiff-with-subfiles ) +# - --flatten: \bibliography commands expand if corresponding bbl file present +# - angled bracket optional commands now parsed correctly (patch #3570) submitted by Dave Kleinschmidt (thanks) +# - \RequirePackage now treated as synonym of \usepackage with respect to setting packages +# - special rules for apacite package (redefine citation commands) +# - recognise /dev/null as 'file-like' arguments for --preamble and --config options +# - fix units package incompatibility with ulem for text maths statements $ ..$ (thanks to Stuart Prescott for reporting this) +# - amsmath environment cases treated correctly (Bug fix #19029) (thanks to Jalar) +# - {,} in comments no longer confuse latexdiff (Bug fix #19146) +# - \% in one-letter sub/Superscripts was not converted correctly +# +# Version 1.0.3 +# - fix bug in add_safe_commands that made latexdiff hang on DeclareMathOperator +# command in preamble +# - \(..\) inline math expressions were not parsed correctly, if they contained a linebreak +# - applied patch contributed by tomflannaghan via Berlios: [ Patch #3431 ] Adds correct handling of \left< and \right> +# - \$ is treated correctly as a literal dollar sign (thanks to Reed Cartwright and Joshua Miller for reporting this bug +# and sketching out the solution) +# - \^ and \_ are correctly interpreted as accent and underlined space, respectively, not as superscript of subscript +# (thanks to Wail Yahyaoui for pointing out this bug) +# +# Version 1.0.1 - treat \big,\bigg etc. equivalently to \left and +# \right - include starred version in MATHENV - apply +# - flatten recursively and --flatten expansion is now +# aware of comments (thanks to Tim Connors for patch) +# - Change to post-processing for more reliability for +# deleted math environments +# - On linux systems, recognise and remove DOS style newlines +# - Provide markup for some special preamble commands (\title, +# \author,\date, +# - configurable by setting context2cmd +# - for styles using ulem package, remove \emph and \text.. from list of +# safe commands in order to allow linebreaks within the +# highlighted sections. +# - for ulem style, now show citations by enclosing them in \mbox commands. +# This unfortunately implies linebreaks within citations no longer function, +# so this functionality can be turned off (Option --disable-citation-markup). +# With --enable-citation-markup, the mbox markup is forced for other styles) +# - new substyle COLOR. This is particularly useful for marking up citations +# and some special post-processing is implemented to retain cite +# commands in deleted blocks. +# - four different levels of math-markup +# - Option --driver for choosing driver for modes employing changebar package +# - accept \\* as valid command (and other commands of form \.*). Also accept +# \ (backslashed newline) +# - some typo fixes, include commands defined in preamble as safe commands +# (Sebastian Gouezel) +# - include compared filenames as comments as line 2 and 3 of +# the preamble (can be modified with option --label, and suppressed with +# --no-label), option --visible-label to show files in generated pdf or dvi +# at the beginning of main document +# +# Version 0.5 A number of minor improvements based on feedback +# Deleted blocks are now shown before added blocks +# Package specific processing +# +# Version 0.43 unreleased typo in list of styles at the end +# Add protect to all \cbstart, \cbend commands +# More robust substitution of deleted math commands +# +# Version 0.42 November 06 Bug fixes only +# +# Version 0.4 March 06 option for fast differencing using UNIX diff command, several minor bug fixes (\par bug, improved highlighting of textcmds) +# +# Version 0.3 August 05 improved parsing of displayed math, --allow-spaces +# option, several minor bug fixes +# +# Version 0.25 October 04 Fix bug with deleted equations, add math mode commands to safecmd, add | to allowed interpunctuation signs +# Version 0.2 September 04 extension to utf-8 and variable encodings +# Version 0.1 August 04 First public release + +use Algorithm::Diff qw(traverse_sequences); + +use Getopt::Long ; +use strict ; +use warnings; +use utf8 ; + +my ($algodiffversion)=split(/ /,$Algorithm::Diff::VERSION); + + +my ($versionstring)=< 3, # minimum number of tokens to form an independent block + # shorter identical blocks will be merged to the previous word + SCALEDELGRAPHICS => 0.5, # factor with which deleted figures will be scaled down (i.e. 0.5 implies they are shown at half linear size) + # this is only used for --graphics-markup=BOTH option + FLOATENV => undef , # Environments in which FL variants of defined commands are used + PICTUREENV => undef , # Environments in which all change markup is removed + MATHENV => undef , # Environments turning on display math mode (code also knows about \[ and \]) + MATHREPL => 'displaymath', # Environment introducing deleted maths blocks + MATHARRENV => undef , # Environments turning on eqnarray math mode + MATHARRREPL => 'eqnarray*', # Environment introducing deleted maths blocks + ARRENV => undef , # Environments making arrays in math mode. The underlining style does not cope well with those - as a result in-text math environments are surrounded by \mbox{ } if any of these commands is used in an inline math block + COUNTERCMD => undef, + # COUNTERCMD textcmds which are associated with a counter + # If any of these commands occur in a deleted block + # they will be succeeded by an \addtocounter{...}{-1} + # for the associated counter such that the overall numbers + # should be the same as in the new file + LISTENV => undef , # list making environments - they will generally be kept + VERBATIMENV => undef, # Environments whose content should be treated as verbatim text and not be touched + VERBATIMLINEENV => undef, # Environments whose content should be treated as verbatim text and processed in line diff mode + LSTINLINEENV => undef,# Environments whose content should be treated as lstinline text and processed as lstinline + CUSTOMDIFCMD => undef,# Custom dif command. Is defined in the document as a \DELcommand and \ADDcommand version to be replaced by the diff + ITEMCMD => 'item' # command marking item in a list environment +); +# Configuration variables: these have to be visible from the subroutines +my ($ARRENV, + $COUNTERCMD, + $FLOATENV, + $ITEMCMD, + $LISTENV, + $MATHARRENV, + $MATHARRREPL, + $MATHENV, + $MATHREPL, + $MINWORDSBLOCK, + $PICTUREENV, + $SCALEDELGRAPHICS, + $VERBATIMENV, + $VERBATIMLINEENV, + $LSTINLINEENV, + $CUSTOMDIFCMD + ); + +# my $MINWORDSBLOCK=3; # minimum number of tokens to form an independent block +# # shorter identical blocks will be merged to the previous word +# my $SCALEDELGRAPHICS=0.5; # factor with which deleted figures will be scaled down (i.e. 0.5 implies they are shown at half linear size) +# # this is only used for --graphics-markup=BOTH option +# my $FLOATENV='(?:figure|table|plate)[\w\d*@]*' ; # Environments in which FL variants of defined commands are used +# my $PICTUREENV='(?:picture|tikzpicture|DIFnomarkup)[\w\d*@]*' ; # Environments in which all change markup is removed +# my $MATHENV='(?:equation[*]?|displaymath|DOLLARDOLLAR)[*]?' ; # Environments turning on display math mode (code also knows about \[ and \]) +# my $MATHREPL='displaymath'; # Environment introducing deleted maths blocks +# my $MATHARRENV='(?:eqnarray|align|alignat|gather|multline|flalign)[*]?' ; # Environments turning on eqnarray math mode +# my $MATHARRREPL='eqnarray*'; # Environment introducing deleted maths blocks +# my $ARRENV='(?:aligned|gathered|array|[pbvBV]?matrix|smallmatrix|cases|split)'; # Environments making arrays in math mode. The underlining style does not cope well with those - as a result in-text math environments are surrounded by \mbox{ } if any of these commands is used in an inline math block +# my $COUNTERCMD='(?:footnote|part|chapter|section|subsection|subsubsection|paragraph|subparagraph)'; # textcmds which are associated with a counter +# # If any of these commands occur in a deleted block +# # they will be succeeded by an \addtocounter{...}{-1} +# # for the associated counter such that the overall numbers +# # should be the same as in the new file +# my $LISTENV='(?:itemize|description|enumerate)'; # list making environments - they will generally be kept +# my $ITEMCMD='item'; # command marking item in a list environment + + + +my $LABELCMD='(?:label)'; # matching commands are disabled within deleted blocks - mostly useful for maths mode, as otherwise it would be fine to just not add those to SAFECMDLIST +my @UNSAFEMATHCMD=('qedhere'); # Commands which are definitely unsafe for marking up in math mode (amsmath qedhere only tested to not work with UNDERLINE markup) (only affects WHOLE and COARSE math markup modes). Note that unlike text mode (or FINE math mode0 deleted unsafe commands are not deleted but simply taken outside \DIFdel +my $MBOXINLINEMATH=0; # if set to 1 then surround marked-up inline maths expression with \mbox ( to get around compatibility + # problems between some maths packages and ulem package + + +# Markup strings +# If at all possible, do not change these as parts of the program +# depend on the actual name (particularly post-processing) +# At the very least adapt subroutine postprocess to new tokens. +my $ADDMARKOPEN='\DIFaddbegin '; # Token to mark begin of appended text +my $ADDMARKCLOSE='\DIFaddend '; # Token to mark end of appended text +my $ADDOPEN='\DIFadd{'; # To mark begin of added text passage +my $ADDCLOSE='}'; # To mark end of added text passage +my $ADDCOMMENT='DIF > '; # To mark added comment line +my $DELMARKOPEN='\DIFdelbegin '; # Token to mark begin of deleted text +my $DELMARKCLOSE='\DIFdelend '; # Token to mark end of deleted text +my $DELOPEN='\DIFdel{'; # To mark begin of deleted text passage +my $DELCLOSE='}'; # To mark end of deleted text passage +my $DELCMDOPEN='%DIFDELCMD < '; # To mark begin of deleted commands (must begin with %, i.e., be a comment +my $DELCMDCLOSE="%%%\n"; # To mark end of deleted commands (must end with a new line) +my $AUXCMD='%DIFAUXCMD' ; # follows auxiliary commands put in by latexdiff to make difference file legal + # auxiliary commands must be on a line of their own + # Note that for verbatim environment openings the %DIFAUXCMD cannot be placed in + # the same line as this would mean they are shown + # so the special form "%DIFAUXCMD NEXT" is used to indicate that the next line + # is an auxiliary command + # Similarly "%DIFAUXCMD LAST" would indicate the auxiliary command is in previous line (not currently used) +my $DELCOMMENT='DIF < '; # To mark deleted comment line +my $VERBCOMMENT='DIFVRB '; # to mark lines which are within a verbatim environment + +# main local variables: +my @TEXTCMDLIST=(); # array containing patterns of commands with text arguments +my @TEXTCMDEXCL=(); # array containing patterns of commands without text arguments (if a pattern + # matches both TEXTCMDLIST and TEXTCMDEXCL it is excluded) +my @CONTEXT1CMDLIST=(); # array containing patterns of commands with text arguments (subset of text commands), + # but which cause confusion if used out of context (e.g. \caption). + # In deleted passages, the command will be disabled but its argument is marked up + # Otherwise they behave exactly like TEXTCMD's +my @CONTEXT1CMDEXCL=(); # exclude list for above, but always empty +my @CONTEXT2CMDLIST=(); # array containing patterns of commands with text arguments, but which fail or cause confusion + # if used out of context (e.g. \title). They and their arguments will be disabled in deleted + # passages +my @CONTEXT2CMDEXCL=(); # exclude list for above, but always empty +my @MATHTEXTCMDLIST=(); # treat like textcmd. If a textcmd is in deleted or added block, just wrap the + # whole content with \DIFadd or \DIFdel irrespective of content. This functionality + # is useful for pseudo commands \MATHBLOCK.. into which math environments are being + # transformed +my @MATHTEXTCMDEXCL=(); # + +# Note I need to declare this with "our" instead of "my" because later in the code I have to "local"ise these +our @SAFECMDLIST=(); # array containing patterns of safe commands (which do not break when in the argument of DIFadd or DIFDEL) +our @SAFECMDEXCL=(); +my @MBOXCMDLIST=(); # patterns for commands which are in principle safe but which need to be surrounded by an \mbox +my @MBOXCMDEXCL=(); # all the patterns in MBOXCMDLIST will be appended to SAFECMDLIST + + +my ($i,$j,$l); +my ($old,$new); +my ($line,$key); +my (@dumlist); +my ($newpreamble,$oldpreamble); +my (@newpreamble,@oldpreamble,@diffpreamble,@diffbody); +my ($latexdiffpreamble); +my ($oldbody, $newbody, $diffbo); +my ($oldpost, $newpost); +my ($diffall); +# Option names +my ($type,$subtype,$floattype,$config,$preamblefile,$encoding,$nolabel,$visiblelabel, + $showpreamble,$showsafe,$showtext,$showconfig,$showall, + $replacesafe,$appendsafe,$excludesafe, + $replacetext,$appendtext,$excludetext, + $replacecontext1,$appendcontext1, + $replacecontext2,$appendcontext2, + $help,$verbose,$driver,$version,$ignorewarnings, + $enablecitmark,$disablecitmark,$allowspaces,$flatten,$nolinks,$debug,$earlylatexdiffpreamble); ###$disablemathmark, +my ($mboxsafe); +# MNEMNONICS for mathmarkup +my $mathmarkup; +use constant { + OFF => 0, + WHOLE => 1, + COARSE => 2, + FINE => 3 +}; +# MNEMNONICS for graphicsmarkup +my $graphicsmarkup; +use constant { + NONE => 0, + NEWONLY => 1, + BOTH => 2 +}; + +my ($mboxcmd); + +my (@configlist,@addtoconfiglist,@labels, + @appendsafelist,@excludesafelist, + @appendmboxsafelist,@excludemboxsafelist, + @appendtextlist,@excludetextlist, + @appendcontext1list,@appendcontext2list, + @packagelist); +my ($assign,@config); +# Hash where keys corresponds to the names of all included packages (including the documentclass as another package +# the optional arguments to the package are the values of the hash elements +my ($pkg,%packages); + +# Defaults +$mathmarkup=COARSE; +$verbose=0; +# output debug and intermediate files, set to 0 in final distribution +$debug=0; +# insert preamble directly after documentclass - experimental feature, set to 0 in final distribution +# Note that this failed with mini example (or other files, where packages used in latexdiff preamble +# are called again with incompatible options in preamble of resulting file) +$earlylatexdiffpreamble=0; + + +# define character properties +sub IsNonAsciiPunct { return <<'END' # Unicode punctuation but excluding ASCII punctuation ++utf8::IsPunct +-utf8::IsASCII +END +} +sub IsNonAsciiS { return <<'END' # Unicode symbol but excluding ASCII ++utf8::IsS +-utf8::IsASCII +END +} + + +my %verbhash; + +Getopt::Long::Configure('bundling'); +GetOptions('type|t=s' => \$type, + 'subtype|s=s' => \$subtype, + 'floattype|f=s' => \$floattype, + 'config|c=s' => \@configlist, + 'add-to-config=s' => \@addtoconfiglist, + 'preamble|p=s' => \$preamblefile, + 'encoding|e=s' => \$encoding, + 'label|L=s' => \@labels, + 'no-label' => \$nolabel, + 'visible-label' => \$visiblelabel, + 'exclude-safecmd|A=s' => \@excludesafelist, + 'replace-safecmd=s' => \$replacesafe, + 'append-safecmd|a=s' => \@appendsafelist, + 'exclude-textcmd|X=s' => \@excludetextlist, + 'replace-textcmd=s' => \$replacetext, + 'append-textcmd|x=s' => \@appendtextlist, + 'replace-context1cmd=s' => \$replacecontext1, + 'append-context1cmd=s' => \@appendcontext1list, + 'replace-context2cmd=s' => \$replacecontext2, + 'append-context2cmd=s' => \@appendcontext2list, + 'exclude-mboxsafecmd=s' => \@excludemboxsafelist, + 'append-mboxsafecmd=s' => \@appendmboxsafelist, + 'show-preamble' => \$showpreamble, + 'show-safecmd' => \$showsafe, + 'show-textcmd' => \$showtext, + 'show-config' => \$showconfig, + 'show-all' => \$showall, + 'packages=s' => \@packagelist, + 'allow-spaces' => \$allowspaces, + 'math-markup=s' => \$mathmarkup, + 'graphics-markup=s' => \$graphicsmarkup, + 'enable-citation-markup|enforce-auto-mbox' => \$enablecitmark, + 'disable-citation-markup|disable-auto-mbox' => \$disablecitmark, + 'verbose|V' => \$verbose, + 'ignore-warnings' => \$ignorewarnings, + 'driver=s'=> \$driver, + 'flatten' => \$flatten, + 'no-links' => \$nolinks, + 'version' => \$version, + 'help|h' => \$help, + 'debug!' => \$debug ) or die "Use latexdiff -h to get help.\n" ; + +if ( $help ) { + usage() ; +} + + +if ( $version ) { + die $versionstring ; +} + +print STDERR $versionstring if $verbose; + +if (defined($showall)){ + $showpreamble=$showsafe=$showtext=$showconfig=1; +} +# Default types +$type='UNDERLINE' unless defined($type); +$subtype='SAFE' unless defined($subtype); +# set floattype to IDENTICAL for LABEL and ONLYCHANGEDPAGE subtype, unless it has been set explicitly on the command line +$floattype=($subtype eq 'LABEL' || $subtype eq 'ONLYCHANGEDPAGE') ? 'IDENTICAL' : 'FLOATSAFE' unless defined($floattype); +if ( $subtype eq 'LABEL' ) { + print STDERR "Note that LABEL subtype is deprecated. If possible, use ZLABEL instead (requires zref package)"; +} + +if (defined($mathmarkup)) { + $mathmarkup=~tr/a-z/A-Z/; + if ( $mathmarkup eq 'OFF' ){ + $mathmarkup=OFF; + } elsif ( $mathmarkup eq 'WHOLE' ){ + $mathmarkup=WHOLE; + } elsif ( $mathmarkup eq 'COARSE' ){ + $mathmarkup=COARSE; + } elsif ( $mathmarkup eq 'FINE' ){ + $mathmarkup=FINE; + } elsif ( $mathmarkup !~ m/^[0123]$/ ) { + die "latexdiff Illegal value: ($mathmarkup) for option--math-markup. Possible values: OFF,WHOLE,COARSE,FINE,0-3\n"; + } + # else use numerical value +} + + + +# setting extra preamble commands +if (defined($preamblefile)) { + $latexdiffpreamble=join "\n",(extrapream($preamblefile),""); +} else { + $latexdiffpreamble=join "\n",(extrapream($type,$subtype,$floattype),""); +} + +if ( defined($driver) ) { + # for changebar only + $latexdiffpreamble=~s/\[dvips\]/[$driver]/sg; +} +# setting up @SAFECMDLIST and @SAFECMDEXCL +if (defined($replacesafe)) { + init_regex_arr_ext(\@SAFECMDLIST,$replacesafe); +} else { + init_regex_arr_data(\@SAFECMDLIST, "SAFE COMMANDS"); +} +foreach $appendsafe ( @appendsafelist ) { + init_regex_arr_ext(\@SAFECMDLIST, $appendsafe); +} +foreach $excludesafe ( @excludesafelist ) { + init_regex_arr_ext(\@SAFECMDEXCL, $excludesafe); +} +# setting up @MBOXCMDLIST and @MBOXCMDEXCL +foreach $mboxsafe ( @appendmboxsafelist ) { + init_regex_arr_ext(\@MBOXCMDLIST, $mboxsafe); +} +foreach $mboxsafe ( @excludemboxsafelist ) { + init_regex_arr_ext(\@MBOXCMDEXCL, $mboxsafe); +} + + + +# setting up @TEXTCMDLIST and @TEXTCMDEXCL +if (defined($replacetext)) { + init_regex_arr_ext(\@TEXTCMDLIST,$replacetext); +} else { + init_regex_arr_data(\@TEXTCMDLIST, "TEXT COMMANDS"); +} +foreach $appendtext ( @appendtextlist ) { + init_regex_arr_ext(\@TEXTCMDLIST, $appendtext); +} +foreach $excludetext ( @excludetextlist ) { + init_regex_arr_ext(\@TEXTCMDEXCL, $excludetext); +} + + +# setting up @CONTEXT1CMDLIST ( @CONTEXT1CMDEXCL exist but is always empty ) +if (defined($replacecontext1)) { + init_regex_arr_ext(\@CONTEXT1CMDLIST,$replacecontext1); +} else { + init_regex_arr_data(\@CONTEXT1CMDLIST, "CONTEXT1 COMMANDS"); +} +foreach $appendcontext1 ( @appendcontext1list ) { + init_regex_arr_ext(\@CONTEXT1CMDLIST, $appendcontext1); +} + + +# setting up @CONTEXT2CMDLIST ( @CONTEXT2CMDEXCL exist but is always empty ) +if (defined($replacecontext2)) { + init_regex_arr_ext(\@CONTEXT2CMDLIST,$replacecontext2); +} else { + init_regex_arr_data(\@CONTEXT2CMDLIST, "CONTEXT2 COMMANDS"); +} +foreach $appendcontext2 ( @appendcontext2list ) { + init_regex_arr_ext(\@CONTEXT2CMDLIST, $appendcontext2); +} + +# setting configuration variables +@config=(); +foreach $config ( @configlist ) { + if (-f $config || lc $config eq '/dev/null' ) { + open(FILE,$config) or die ("Couldn't open configuration file $config: $!"); + while () { + chomp; + next if /^\s*#/ || /^\s*%/ || /^\s*$/ ; + push (@config,$_); + } + close(FILE); + } + else { +# foreach ( split(",",$config) ) { +# push @config,$_; +# } + push @config,split(",",$config) + } +} +foreach $assign ( @config ) { + $assign=~ m/\s*(\w*)\s*=\s*(\S*)\s*$/ or die "Illegal assignment $assign in configuration list (must be variable=value)"; + exists $CONFIG{$1} or die "Unknown configuration variable $1."; + $CONFIG{$1}=$2; +} + +my @addtoconfig=(); +foreach $config ( @addtoconfiglist ) { + if (-f $config || lc $config eq '/dev/null' ) { + open(FILE,$config) or die ("Couldn't open addd-to-config file $config: $!"); + while () { + chomp; + next if /^\s*#/ || /^\s*%/ || /^\s*$/ ; + push (@addtoconfig,$_); + } + close(FILE); + } + else { +# foreach ( split(",",$config) ) { +# push @addtoconfig,$_; +# } + push @addtoconfig,split(",",$config) + } +} + +# initialise default lists from DATA +# for those configuration variables, which have not been set explicitly, initiate from list in document +foreach $key ( keys(%CONFIG) ) { + if (!defined $CONFIG{$key}) { + @dumlist=(); + init_regex_arr_data(\@dumlist,"$key CONFIG"); + $CONFIG{$key}=join(";",@dumlist) + } +} + + +foreach $assign ( @addtoconfig ) { + $assign=~ m/\s*(\w*)\s*=\s*(\S*)\s*$/ or die "Illegal assignment $assign in configuration list (must be variable=value)"; + exists $CONFIG{$1} or die "Unknown configuration variable $1."; + $CONFIG{$1}.=";$2"; +} + +# Map from hash to variables (we do this to have more concise code later, change from comma-separeted list) +foreach ( keys(%CONFIG) ) { + if ( $_ eq "MINWORDSBLOCK" ) { $MINWORDSBLOCK = $CONFIG{$_}; } + elsif ( $_ eq "FLOATENV" ) { $FLOATENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "ITEMCMD" ) { $ITEMCMD = $CONFIG{$_} ; } + elsif ( $_ eq "LISTENV" ) { $LISTENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "PICTUREENV" ) { $PICTUREENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "MATHENV" ) { $MATHENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "MATHREPL" ) { $MATHREPL = $CONFIG{$_} ; } + elsif ( $_ eq "MATHARRENV" ) { $MATHARRENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "MATHARRREPL" ) { $MATHARRREPL = $CONFIG{$_} ; } + elsif ( $_ eq "ARRENV" ) { $ARRENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "VERBATIMENV" ) { $VERBATIMENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "VERBATIMLINEENV" ) { $VERBATIMLINEENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "LSTINLINEENV" ) { $LSTINLINEENV = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "CUSTOMDIFCMD" ) { $CUSTOMDIFCMD = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "COUNTERCMD" ) { $COUNTERCMD = liststringtoregex($CONFIG{$_}) ; } + elsif ( $_ eq "SCALEDELGRAPHICS" ) { $SCALEDELGRAPHICS = $CONFIG{$_} ; } + else { die "Unknown configuration variable $_.";} +} + +if ( $mathmarkup == COARSE || $mathmarkup == WHOLE ) { + push(@MATHTEXTCMDLIST,qr/^MATHBLOCK(?:$MATHENV|$MATHARRENV|SQUAREBRACKET)$/); +} + + + +foreach $pkg ( @packagelist ) { + map { $packages{$_}="" } split(/,/,$pkg) ; +} + + + +if ($showconfig || $showtext || $showsafe || $showpreamble) { + show_configuration(); + exit 0; +} + +if ( @ARGV != 2 ) { + print STDERR "2 and only 2 non-option arguments required. Write latexdiff -h to get help\n"; + exit(2); +} + +# Are extra spaces between command arguments permissible? +my $extraspace; +if ($allowspaces) { + $extraspace='\s*'; +} else { + $extraspace=''; +} + +# append context lists to text lists (as text property is implied) +push @TEXTCMDLIST, @CONTEXT1CMDLIST; +push @TEXTCMDLIST, @CONTEXT2CMDLIST; + +push @TEXTCMDLIST, @MATHTEXTCMDLIST if $mathmarkup==COARSE; + +# internal additions to SAFECMDLIST +push(@SAFECMDLIST, qr/^QLEFTBRACE$/, qr/^QRIGHTBRACE$/); + + +# Patterns. These are used by some of the subroutines, too +# I can only define them down here because value of extraspace depends on an option + + my $pat0 = '(?:[^{}])*'; + my $pat_n = $pat0; +# if you get "undefined control sequence MATHBLOCKmath" error, increase the maximum value in this loop + for (my $i_pat = 0; $i_pat < 20; ++$i_pat){ + $pat_n = '(?:[^{}]|\{'.$pat_n.'\}|\\\\\{|\\\\\})*'; + # Actually within the text body, quoted braces are replaced in pre-processing. The only place where + # the last part of the pattern matters is when processing the arguments of context2cmds in the preamble + # and these contain a \{ or \} combination, probably rare. + # It should thus be fine to use the simpler version below. + ### $pat_n = '(?:[^{}]|\{'.$pat_n.'\})*'; + } + + my $brat0 = '(?:[^\[\]]|\\\[|\\\])*'; + my $brat_n = $brat0; + for (my $i_pat = 0; $i_pat < 4; ++$i_pat){ + $brat_n = '(?:[^\[\]]|\['.$brat_n.'\]|\\\[|\\\])*'; + ### $brat_n = '(?:[^\[\]]|\['.$brat_n.'\])*'; # Version not taking into account escaped \[ and \] + } + my $abrat0 = '(?:[^<>])*'; + + my $quotemarks = '(?:\'\')|(?:\`\`)'; + my $punct='[0.,\/\'\`:;\"\?\(\)\[\]!~\p{IsNonAsciiPunct}\p{IsNonAsciiS}]'; + my $number='-?\d*\.\d*'; + my $mathpunct='[+=<>\-\|]'; + my $and = '&'; + my $coords= '[\-.,\s\d]*'; +# quoted underscore - this needs special treatment as perl treats _ as a letter (\w) but latex does not +# such that a\_b is interpreted as a{\_}b by latex but a{\_b} by perl + my $quotedunderscore='\\\\_'; +# word: sequence of letters or accents followed by letter + my $word_ja='\p{Han}+|\p{InHiragana}+|\p{InKatakana}+'; + my $word='(?:' . $word_ja . '|(?:(?:[-\w\d*]|\\\\[\"\'\`~^][A-Za-z\*])(?!(?:' . $word_ja . ')))+)'; + my $cmdleftright='\\\\(?:left|right|[Bb]igg?[lrm]?|middle)\s*(?:[<>()\[\]|\.]|\\\\(?:[|{}]|\w+))'; + my $cmdoptseq='\\\\[\w\d@\*]+'.$extraspace.'(?:(?:<'.$abrat0.'>|\['.$brat_n.'\]|\{'. $pat_n . '\}|\(' . $coords .'\))'.$extraspace.')*'; + my $defseq='\\\\def\\\\[\w\d@\*]+(?:#\d+|\[#\d+\])+(?:\{'. $pat_n . '\})?'; + my $backslashnl='\\\\\n'; + my $oneletcmd='\\\\.\*?(?:\['.$brat_n.'\]|\{'. $pat_n . '\})*'; + my $math='\$(?:[^$]|\\\$)*?\$|\\\\[(](?:.|\n)*?\\\\[)]'; +## the current maths command cannot cope with newline within the math expression + my $comment='%[^\n]*\n'; + my $pat=qr/(?:\A\s*)?(?:${and}|${quotemarks}|${number}|${word}|$quotedunderscore|${defseq}|$cmdleftright|${cmdoptseq}|${math}|${backslashnl}|${oneletcmd}|${comment}|${punct}|${mathpunct}|\{|\})\s*/ ; + + + + +# now we are done setting up and can start working +my ($oldfile, $newfile) = @ARGV; +# check for existence of input files +if ( ! -e $oldfile ) { + die "Input file $oldfile does not exist"; +} +if ( ! -e $newfile ) { + die "Input file $newfile does not exist"; +} + + +# set the labels to be included into the file +# first find out which file name is longer for correct alignment +my ($diff,$oldlabel_n_spaces,$newlabel_n_spaces); +$oldlabel_n_spaces = 0; +$newlabel_n_spaces = 0; +$diff = length($newfile) - length($oldfile); +if ($diff > 0) { + $oldlabel_n_spaces = $diff; +} +if ($diff < 0) { + $newlabel_n_spaces = abs($diff); +} + +my ($oldtime,$newtime,$oldlabel,$newlabel); +if (defined($labels[0])) { + $oldlabel=$labels[0] ; +} else { + $oldtime=localtime((stat($oldfile))[9]); + $oldlabel="$oldfile " . " "x($oldlabel_n_spaces) . $oldtime; +} +if (defined($labels[1])) { + $newlabel=$labels[1] ; +} else { + $newtime=localtime((stat($newfile))[9]); + $newlabel="$newfile " . " "x($newlabel_n_spaces) . $newtime; +} + +$encoding=guess_encoding($newfile) unless defined($encoding); + +$encoding = "utf8" if $encoding =~ m/^utf8/i ; +if (lc($encoding) eq "utf8" ) { + binmode(STDOUT, ":utf8"); + binmode(STDERR, ":utf8"); +} + +$old=read_file_with_encoding($oldfile,$encoding); +$new=read_file_with_encoding($newfile,$encoding); + + + + +# reset time +exetime(1); +($oldpreamble,$oldbody,$oldpost)=splitdoc($old,'\\\\begin\{document\}','\\\\end\{document\}'); + +($newpreamble,$newbody,$newpost)=splitdoc($new,'\\\\begin\{document\}','\\\\end\{document\}'); + + +if ($flatten) { + $oldbody=flatten($oldbody,$oldpreamble,$oldfile,$encoding); + $newbody=flatten($newbody,$newpreamble,$newfile,$encoding); + # flatten preamble + $oldpreamble=flatten($oldpreamble,$oldpreamble,$oldfile,$encoding); + $newpreamble=flatten($newpreamble,$newpreamble,$newfile,$encoding); + +} + + + + +my @auxlines; + +# boolean variab +my ($ulem)=0; + +if ( length $oldpreamble && length $newpreamble ) { + # pre-process preamble by looking for commands used in \maketitle (title, author, date etc commands) + # and marking up content with latexdiff markup + @auxlines=preprocess_preamble($oldpreamble,$newpreamble); + + @oldpreamble = split /\n/, $oldpreamble; + @newpreamble = split /\n/, $newpreamble; + + # If a command is defined in the preamble of the new file, and only uses safe commands, then it can be considered to be safe) (contribution S. Gouezel) + # Base this assessment on the new preamble + add_safe_commands($newpreamble); + + # get a list of packages from preamble if not predefined + %packages=list_packages($newpreamble) unless %packages; + if ( %packages && $debug ) { my $key ; foreach $key (keys %packages) { print STDERR "DEBUG \\usepackage[",$packages{$key},"]{",$key,"}\n" ;} } +} + +# have to return to all processing to properly add preamble additions based on packages found +if (defined($graphicsmarkup)) { + $graphicsmarkup=~tr/a-z/A-Z/; + if ( $graphicsmarkup eq 'OFF' or $graphicsmarkup eq 'NONE' ) { + $graphicsmarkup=NONE; + } elsif ( $graphicsmarkup eq 'NEWONLY' or $graphicsmarkup eq 'NEW-ONLY' ) { + $graphicsmarkup=NEWONLY; + } elsif ( $graphicsmarkup eq 'BOTH' ) { + $graphicsmarkup=BOTH; + } elsif ( $graphicsmarkup !~ m/^[012]$/ ) { + die "latexdiff Illegal value: ($graphicsmarkup) for option --highlight-graphics. Possible values: OFF,WHOLE,COARSE,FINE,0-2\n"; + } + # else use numerical value +} else { + # Default: no explicit setting in menu + if ( defined $packages{"graphicx"} or defined $packages{"graphics"} ) { + $graphicsmarkup=NEWONLY; + } else { + $graphicsmarkup=NONE; + } +} + +if (defined $packages{"hyperref"} ) { + # deleted lines should not generate or appear in link names: + print STDERR "hyperref package detected.\n" if $verbose ; + $latexdiffpreamble =~ s/\{\\DIFadd\}/{\\DIFaddtex}/g; + $latexdiffpreamble =~ s/\{\\DIFdel\}/{\\DIFdeltex}/g; + $latexdiffpreamble .= join "\n",(extrapream("HYPERREF"),""); + if($nolinks){ + $latexdiffpreamble .= "\n\\hypersetup{bookmarks=false}"; + } + ### $latexdiffpreamble .= '%DIF PREAMBLE EXTENSION ADDED BY LATEXDIFF FOR HYPERREF PACKAGE' . "\n"; + ### $latexdiffpreamble .= '\providecommand{\DIFadd}[1]{\texorpdfstring{\DIFaddtex{#1}}{#1}}' . "\n"; + ### $latexdiffpreamble .= '\providecommand{\DIFdel}[1]{\texorpdfstring{\DIFdeltex{#1}}{}}' . "\n"; + ### $latexdiffpreamble .= '%DIF END PREAMBLE EXTENSION ADDED BY LATEXDIFF FOR HYPERREF PACKAGE' . "\n"; +} + +# add commands for figure highlighting to preamble +if ($graphicsmarkup != NONE ) { + my @matches; + # Check if \DIFaddbeginFL definition calls \DIFaddbegin - if so we will issue an error message that graphics highlighting is + # is not compatible with this. + # (A more elegant solution would be to suppress the redefinitions of the \DIFaddbeginFL etc commands, but for this narrow use case + # I currently don't see this as an efficient use of time) + ### The foreach loop does not make sense here. I don't know why I put this in - (F Tilmann) + ###foreach my $cmd ( "DIFaddbegin","DIFaddend","DIFdelbegin","DIFdelend" ) { + @matches=( $latexdiffpreamble =~ m/command\{\\DIFaddbeginFL}\{($pat_n)}/sg ) ; + # we look at the last one of the list to take into account possible redefinition but almost always matches should have exactly one element + if ( $matches[$#matches] =~ m/\\DIFaddbegin/ ) { + die "Cannot combine graphics markup with float styles defining \\DIFaddbeginFL in terms of \\DIFaddbegin. Use --graphics-markup=none option or choose a different float style."; + exit 10; + } + ###} + $latexdiffpreamble .= join "\n",("\\newcommand{\\DIFscaledelfig}{$SCALEDELGRAPHICS}",extrapream("HIGHLIGHTGRAPHICS"),""); + + # only change required for highlighting both is to declare \includegraphics safe, as preamble already contains commands for deleted environment + if ( $graphicsmarkup == BOTH ) { + init_regex_arr_list(\@SAFECMDLIST,'includegraphics'); + } +} + +$ulem = ($latexdiffpreamble =~ /\\RequirePackage(?:\[$brat_n\])?\{ulem\}/ || defined $packages{"ulem"}); + + +# If listings is being used or can be found in the latexdiff search path, add to the preamble auxiliary code to enable line-by-line markup +if ( defined($packages{"listings"}) or `kpsewhich listings.sty` ne "" ) { + my @listingpreamble=extrapream("LISTINGS"); + my @listingDIFcode=(); + my $replaced; + # note that in case user supplies preamblefile the type might not reflect well the + @listingDIFcode=extrapream("-nofail","DIFCODE_" . $type) unless defined($preamblefile); + if (!(@listingDIFcode)) { + # if listingDIFcode is empty try to guess a suitable one from the preamble + if ($latexdiffpreamble =~ /\\RequirePackage(?:\[$brat_n\])?\{color\}/ and $ulem ) { + @listingDIFcode=extrapream("DIFCODE_UNDERLINE"); + } elsif ( $latexdiffpreamble =~ /\\RequirePackage(?:\[$brat_n\])?\{color\}/ ) { + # only colour used + @listingDIFcode=extrapream("DIFCODE_CFONT"); + } else { + # fall-back solution + @listingDIFcode=extrapream("DIFCODE_BOLD"); + } + } + # now splice it in + $replaced=0; + ###print STDERR "DEBUG: listingDIFcode: ",join("\n",@listingDIFcode),"|||\n" if $debug; + + @listingpreamble=grep { + # only replace if this has not been done already (use short-circuit property of and) + if (!$replaced and $_ =~ s/^.*%DIFCODE TEMPLATE.*$/join("\n",@listingDIFcode)/e ) { + ###print STDERR "DEBUG: Replaced text $_\n" if $debug; + $replaced=1; + 1; + } else { + # return false for those lines matching %DIFCODE TEMPLATE (so that they are not included in output) + not m/%DIFCODE TEMPLATE/; + } + } @listingpreamble; + ### print STDERR "DEBUG: listingpreamble @listingpreamble\n"; + $latexdiffpreamble .= join "\n",(@listingpreamble,""); +} else { + print STDERR "WARNING: listings package not detected. Disabling mark-up in verbatim environments \n" ; + # if listings does not exist disable line-by-line markup and treat all verbatim environments as opaque + $VERBATIMENV = liststringtoregex($CONFIG{VERBATIMENV}.";".$CONFIG{VERBATIMLINEENV}); + $VERBATIMLINEENV = ""; +} + +# adding begin and end marker lines to preamble +$latexdiffpreamble = "%DIF PREAMBLE EXTENSION ADDED BY LATEXDIFF\n" . $ latexdiffpreamble . "%DIF END PREAMBLE EXTENSION ADDED BY LATEXDIFF\n"; + +# and return to preamble specific processing +if ( length $oldpreamble && length $newpreamble ) { + print STDERR "Differencing preamble.\n" if $verbose; + + # insert dummy first line such that line count begins with line 1 (rather than perl's line 0) - just so that line numbers inserted by linediff are correct + unshift @newpreamble,''; + unshift @oldpreamble,''; + @diffpreamble = linediff(\@oldpreamble, \@newpreamble); + # remove dummy line again + shift @diffpreamble; + # add filenames, modification time and latexdiff mark + defined($nolabel) or splice @diffpreamble,1,0, + "%DIF LATEXDIFF DIFFERENCE FILE", + ,"%DIF DEL $oldlabel", + "%DIF ADD $newlabel"; + if ( @auxlines ) { + push @diffpreamble,"%DIF DELETED TITLE COMMANDS FOR MARKUP"; + push @diffpreamble,join("\n",@auxlines); + } + if ( $earlylatexdiffpreamble) { + # insert latexdiff command directly after documentclass at beginning of preamble + # note that grep is only run for its side effect + ( grep { s/^([^%]*\\documentclass.*)$/$1$latexdiffpreamble/ } @diffpreamble )==1 or die "Could not find documentclass statement in preamble"; + } else { + # insert latexdiff commands at the end of preamble (default behaviour) + push @diffpreamble,$latexdiffpreamble; + } + push @diffpreamble,'\begin{document}'; + if (defined $packages{"hyperref"} && $nolinks) { + push @diffpreamble, '\begin{NoHyper}'; + } +} +elsif ( !length $oldpreamble && !length $newpreamble ) { + @diffpreamble=(); +} else { + print STDERR "Either both texts must have preamble or neither text must have the preamble.\n"; + exit(2); +} + +# Special: treat all cite commands as safe except in UNDERLINE and FONTSTRIKE mode +# (there is a conflict between citation and ulem package, see +# package documentation) +# Use post-processing +# and $packages{"apacite"}!~/natbibpapa/ + + +if (defined $packages{"units"} && $ulem ) { + # protect inlined maths environments by surrounding with an \mbox + # this is done to get around an incompatibility between the ulem and units package + # where spaces in the argument to underlined or crossed-out \unit commands cause an error message + print STDERR "units package detected at the same time as style using ulem.\n" if $verbose ; + $MBOXINLINEMATH=1; +} + +if (defined $packages{"siunitx"} ) { + # protect SI command by surrounding them with an \mbox + # this is done to get around an incompatibility between the ulem and siunitx package + print STDERR "siunitx package detected.\n" if $verbose ; + my $mboxcmds='SI,ang,numlist,numrange,SIlist,SIrange'; + init_regex_arr_list(\@SAFECMDLIST,'num,si'); + if ( $enablecitmark || ( $ulem && ! $disablecitmark )) { + init_regex_arr_list(\@MBOXCMDLIST,$mboxcmds); + } else { + init_regex_arr_list(\@SAFECMDLIST,$mboxcmds); + } +} + +if (defined $packages{"cleveref"} ) { + # protect selected command by surrounding them with an \mbox + # this is done to get around an incompatibility between ulem and cleveref package + print STDERR "cleveref package detected.\n" if $verbose ; + my $mboxcmds='[Cc]ref(?:range)?\*?,labelcref,(?:lc)?name[cC]refs?' ; + if ( $enablecitmark || ( $ulem && ! $disablecitmark )) { + init_regex_arr_list(\@MBOXCMDLIST,$mboxcmds); + } else { + init_regex_arr_list(\@SAFECMDLIST,$mboxcmds); + } +} + +if (defined $packages{"glossaries"} ) { + # protect selected command by surrounding them with an \mbox + # this is done to get around an incompatibility between ulem and glossaries package + print STDERR "glossaries package detected.\n" if $verbose ; + my $mboxcmds='[gG][lL][sS](?:|pl|disp|link|first|firstplural|desc|user[iv][iv]?[iv]?),[aA][cC][rR](?:long|longpl|full|fullpl),[aA][cC][lfp]?[lfp]?'; + init_regex_arr_list(\@SAFECMDLIST,'[gG][lL][sS](?:(?:entry)?(?:text|plural|name|symbol)|displaynumberlist|entryfirst|entryfirstplural|entrydesc|entrydescplural|entrysymbolplural|entryuser[iv][iv]?[iv]?|entrynumberlist|entrydisplaynumberlist|entrylong|entrylongpl|entryshort|entryshortpl|entryfull|entryfullpl),[gG]lossentry(?:name|desc|symbol),[aA][cC][rR](?:short|shortpl),[aA]csp?'); + if ( $enablecitmark || ( $ulem && ! $disablecitmark )) { + init_regex_arr_list(\@MBOXCMDLIST,$mboxcmds); + } else { + init_regex_arr_list(\@SAFECMDLIST,$mboxcmds); + } +} + +if (defined $packages{"chemformula"} or defined $packages{"chemmacros"} ) { + print STDERR "chemformula package detected.\n" if $verbose ; + init_regex_arr_list(\@SAFECMDLIST,'ch'); + push(@UNSAFEMATHCMD,'ch'); + # The next command would be needed to allow highlighting the interior of \ch commands in math environments + # but the redefinitions in chemformula are too deep to make this viable + # push(@MATHTEXTCMDLIST,'ch'); +} + +if (defined $packages{"mhchem"} ) { + print STDERR "mhchem package detected.\n" if $verbose ; + init_regex_arr_list(\@SAFECMDLIST,'ce'); + push(@UNSAFEMATHCMD,'ce','cee'); + # The next command would be needed to allow highlighting the interior of \cee commands in math environments + # but the redefinitions in chemformula are too deep to make this viable + # push(@MATHTEXTCMDLIST,'cee'); +} + + +my ( $citpat); + +if ( defined $packages{"apacite"} ) { + print STDERR "apacite package detected.\n" if $verbose ; + $citpat='(?:mask)?(?:full|short|no)?cite(?:A|author|year|meta)?(?:NP)?'; +} else { + # citation command pattern for all other citation schemes + $citpat='(?:cite\w*|nocite)'; +}; + +if ( ! $ulem ) { + # modes not using ulem: citation is safe + push (@SAFECMDLIST, $citpat); +} else { + ### Experimental: disable text and emph commands + push(@SAFECMDEXCL, qr/^emph$/, qr/^text..$/); + # replace \cite{..} by \mbox{\cite{..}} in added or deleted blocks in post-processing + push(@MBOXCMDLIST,$citpat) unless $disablecitmark; + if ( uc($subtype) eq "COLOR" or uc($subtype) eq "DVIPSCOL" ) { + # remove \cite command again from list of safe commands + pop @MBOXCMDLIST; + # deleted cite commands + } +} +push(@MBOXCMDLIST,$citpat) if $enablecitmark ; + + +if (defined $packages{"amsmath"} or defined $packages{"amsart"} or defined $packages{"amsbook"} ) { + print STDERR "amsmath package detected.\n" if $verbose ; + $MATHARRREPL='align*'; +} + +# add commands in MBOXCMDLIST to SAFECMDLIST +foreach $mboxcmd ( @MBOXCMDLIST ) { + init_regex_arr_list(\@SAFECMDLIST, $mboxcmd); +} + +# check if \label is in SAFECMDLIST, and if yes replace "label" in $LABELCMD by something that never matches (we hope!) +if ( iscmd("label",\@SAFECMDLIST,\@SAFECMDEXCL) ) { + $LABELCMD=~ s/label/NEVERMATCHLABEL/; +} + + + +print STDERR "Preprocessing body. " if $verbose; +preprocess($oldbody,$newbody); + + +# run difference algorithm +@diffbody=bodydiff($oldbody, $newbody); +$diffbo=join("",@diffbody); +if ( $debug ) { + open(RAWDIFF,">","latexdiff.debug.bodydiff"); + print RAWDIFF $diffbo; + close(RAWDIFF); +} +print STDERR "(",exetime()," s)\n","Postprocessing body. \n" if $verbose; +postprocess($diffbo); +$diffall =join("\n",@diffpreamble) ; +# add visible labels +if (defined($visiblelabel)) { + # Give information right after \begin{document} (or at the beginning of the text for files without preamble + ### if \date command is used, add information to \date argument, otherwise give right after \begin{document} + ### $diffall=~s/(\\date$extraspace(?:\[$brat0\])?$extraspace)\{($pat_n)\}/$1\{$2 \\ LATEXDIFF comparison \\ Old: $oldlabel \\ New: $newlabel \}/ or + $diffbo = "\\begin{verbatim}LATEXDIFF comparison\nOld: $oldlabel\nNew: $newlabel\\end{verbatim}\n$diffbo" ; +} + +$diffall .= "$diffbo" ; +if (defined $packages{"hyperref"} && $nolinks) { + $diffall .= "\\end{NoHyper}\n"; +} +$diffall .= "\\end{document}$newpost" if length $newpreamble ; +if ( lc($encoding) ne "utf8" && lc($encoding) ne "ascii" ) { + print STDERR "Encoding output file to $encoding\n" if $verbose; + $diffall=Encode::encode($encoding,$diffall); + binmode STDOUT; +} +print $diffall; + + +print STDERR "(",exetime()," s)\n","Done.\n" if $verbose; + + +# liststringtoregex(liststring) +# expands string with semi-colon separated list into a regular expression corresponding +# matching any of the elements +sub liststringtoregex { + my ($liststring)=@_; + my @elements=grep /\S/,split(";",$liststring); + if ( @elements) { + return('(?:(?:' . join(')|(?:',@elements) .'))'); + } else { + return ""; + } +} + +# show_configuration +# note that this is not encapsulated but uses variables from the main program +# It is provided for convenience because in the future it is planned to allow output +# to be modified based on what packages are read etc - this works only if the input files are actually read +# whether or not additional files are provided +sub show_configuration { + if ($showpreamble) { + print "\nPreamble commands:\n"; + print $latexdiffpreamble ; + } + + if ($showsafe) { + print "\nsafecmd: Commands safe within scope of $ADDOPEN $ADDCLOSE and $DELOPEN $DELCLOSE (unless excluded):\n"; + print_regex_arr(@SAFECMDLIST); + print "\nsafecmd-exlude: Commands not safe within scope of $ADDOPEN $ADDCLOSE and $DELOPEN $DELCLOSE :\n"; + print_regex_arr(@SAFECMDEXCL); + print "\nmboxsafecmd: Commands safe only if they are surrounded by \\mbox command:\n"; + print_regex_arr(@MBOXCMDLIST); + print "\nnmboxsafecmd: Commands not safe:\n"; + print_regex_arr(@MBOXCMDEXCL); + } + + if ($showtext) { + print "\nCommands with last argument textual (unless excluded) and safe in every context:\n"; + print_regex_arr(@TEXTCMDLIST); + print "\nContext1 commands (last argument textual, command will be disabled in deleted passages, last argument will be shown as plain text):\n"; + print_regex_arr(@CONTEXT1CMDLIST); + print "\nContext2 commands (last argument textual, command and its argument will be disabled in deleted passages):\n"; + print_regex_arr(@CONTEXT2CMDLIST); + print "\nExclude list of Commands with last argument not textual (overrides patterns above):\n"; + print_regex_arr(@TEXTCMDEXCL); + } + + + if ($showconfig) { + print "Configuration variables:\n"; + print "ARRENV=$ARRENV\n"; + print "COUNTERCMD=$COUNTERCMD\n"; + print "FLOATENV=$FLOATENV\n"; + print "ITEMCMD=$ITEMCMD\n"; + print "LISTENV=$LISTENV\n"; + print "MATHARRENV=$MATHARRENV\n"; + print "MATHARRREPL=$MATHARRREPL\n"; + print "MATHENV=$MATHENV\n"; + print "MATHREPL=$MATHREPL\n"; + print "MINWORDSBLOCK=$MINWORDSBLOCK\n"; + print "PICTUREENV=$PICTUREENV\n"; + print "SCALEDELGRAPHICS=$SCALEDELGRAPHICS\n"; + print "VERBATIMENV=$VERBATIMENV\n"; + print "VERBATIMLINEENV=$VERBATIMLINEENV\n"; + print "LSTINLINEENV=$LSTINLINEENV\n"; + print "CUSTOMDIFCMD=$CUSTOMDIFCMD\n"; + } +} + + + +## guess_encoding(filename) +## reads the first 20 lines of filename and looks for call of inputenc package +## if found, return the option of this package (encoding), otherwise return utf8 +sub guess_encoding { + my ($filename)=@_; + my ($i,$enc); + open (FH, $filename) or die("Couldn't open $filename: $!"); + $i=0; + while () { + next if /^\s*%/; # skip comment lines + if (m/\\usepackage\[(\w*?)\]\{inputenc\}/) { + close(FH); + return($1); + } + last if (++$i > 20 ); # scan at most 20 non-comment lines + } + close(FH); + ### return("ascii"); + return("utf8"); +} + + +sub read_file_with_encoding { + my ($output); + my ($filename, $encoding) = @_; + + if (lc($encoding) eq "utf8" ) { + open (FILE, "<:utf8",$filename) or die("Couldn't open $filename: $!"); + local $/ ; # locally set record operator to undefined, ie. enable whole-file mode + $output=; + } elsif ( lc($encoding) eq "ascii") { + open (FILE, $filename) or die("Couldn't open $filename: $!"); + local $/ ; # locally set record operator to undefined, ie. enable whole-file mode + $output=; + } else { + require Encode; + open (FILE, "<",$filename) or die("Couldn't open $filename: $!"); + local $/ ; # locally set record operator to undefined, ie. enable whole-file mode + $output=; + print STDERR "Converting $filename from $encoding to utf8\n" if $verbose; + $output=Encode::decode($encoding,$output); + } + close FILE; + if ($^O eq "linux" ) { + $output =~ s/\r\n/\n/g ; + } + return $output; +} + +## %packages=list_packages(@preamble) +## scans the arguments for \documentclass,\RequirePackage and \usepackage statements and constructs a hash +## whose keys are the included packages, and whose values are the associated optional arguments +#sub list_packages { +# my (@preamble)=@_; +# my %packages=(); +# foreach $line ( @preamble ) { +# # get rid of comments +# $line=~s/(?catfile($dirname,$fname); + print STDERR "DEBUG Beg of line match |$1|\n" if defined($1) && $debug ; + print STDERR "Include file $fname\n" if $verbose; + print STDERR "DEBUG looking for file ",$fullfile, "\n" if $debug; + # content of file becomes replacement value (use recursion), add \newpage if the command was include + if ( -f $fullfile ) { + # If file exists, replace input or include command with expanded input + $replacement=flatten(read_file_with_encoding($fullfile, $encoding), $preamble,$filename,$encoding) or die "Could not open file ",$fullfile,": $!"; + $replacement = remove_endinput($replacement); + # \include always starts a new page; use explicit \newpage command to simulate this + $newpage=(defined($4)? " \\newpage " : "") ; + } else { + # if file does not exist, do not expand include or input command (do not warn if fname contains #[0-9] as it is then likely part of a command definition + # and is not meant to be expanded directly + print STDERR "WARNING: Could not find included file ",$fullfile,". I will continue but not expand |$2|\n" unless $fname =~ m(#[0-9]) ; + $replacement = $2 ; # i.e. just the original command again -> make no change file does not exist + $newpage=""; + } + "$begline$newpage$replacement$newpage"; + }/exgm; + + # replace bibliography with bbl file if it exists + $text=~s/(^(?:[^%\n]|\\%)*)\\bibliography\{(.*?)\}/{ + if ( -f $bblfile ){ + $replacement=read_file_with_encoding(File::Spec->catfile($bblfile), $encoding); + } else { + warn "Bibliography file $bblfile cannot be found. No flattening of \\bibliography done. Run bibtex on old and new files first"; + $replacement="\\bibliography{$2}"; + } + $begline=(defined($1)? $1 : "") ; + "$begline$replacement"; + }/exgm; + + # replace subfile with contents (subfile package) + $text=~s/(^(?:[^%\n]|\\%)*)\\subfile\{(.*?)\}/{ + $begline=(defined($1)? $1 : "") ; + $fname = $2; + # # add tex extension unless there is a three or four letter extension already + $fname .= ".tex" unless $fname =~ m|\.\w{3,4}|; + print STDERR "Include file as subfile $fname\n" if $verbose; + # content of file becomes replacement value (use recursion) + # now strip away everything outside and including \begin{document} and \end{document} pair# + # # note: no checking for comments is made + $fullfile=File::Spec->catfile($dirname,$fname); + if ( -f $fullfile) { + # if file exists, expand \subfile command by contents of file + $subfile=read_file_with_encoding($fullfile,$encoding) or die "Could not open included subfile ",$fullfile,": $!"; + ($subpreamble,$subbody,$subpost)=splitdoc($subfile,'\\\\begin\{document\}','\\\\end\{document\}'); + ### $subfile=~s|^.*\\begin{document}||s; + ### $subfile=~s|\\end{document}.*$||s; + $replacement=flatten($subbody, $preamble,$filename,$encoding); + ### $replacement = remove_endinput($replacement); + } else { + # if file does not exist, do not expand subfile + print STDERR "WARNING: Could not find subfile ",$fullfile,". I will continue but not expand |$2|\n" unless $fname =~ m(#[0-9]) ; + $replacement = "\\subfile\{$2\}" ; # i.e. just the original command again -> make no change file does not exist + } + + "$begline$replacement"; + }/exgm; + + # replace \verbatiminput and \lstlistinginput + $text=~s/(^(?:[^%\n]|\\%)*)\\(verbatiminput\*?|lstinputlisting)$extraspace(\[$brat_n\])?$extraspace\{(.*?)\}/{ + $begline=(defined($1)? $1 : "") ; + $command = $2 ; + $fname = $4 ; + $verboptions = defined($3)? $3 : "" ; + if ($command eq 'verbatiminput' ) { + $verbenv = "verbatim" ; + } elsif ($command eq 'verbatiminput*' ) { + $verbenv = "verbatim*" ; + } elsif ($command eq 'lstinputlisting' ) { + $verbenv = "lstlisting" ; + } else { + die "Internal errorL Unexpected verbatim input type $command.\n"; + } + print STDERR "DEBUG Beg of line match |$begline|\n" if $debug ; + print STDERR "Include file $fname verbatim\n" if $verbose; + print STDERR "DEBUG looking for file ",File::Spec->catfile($dirname,$fname), "\n" if $debug; + # content of file becomes replacement value (do not use recursion), add \newpage if the command was include + ###$replacement=read_file_with_encoding(File::Spec->catfile($dirname,$fname), $encoding) or die "Couldn't find file ",File::Spec->catfile($dirname,$fname),": $!"; + $replacement=read_file_with_encoding(File::Spec->catfile($dirname,$fname), $encoding) or die "Couldn't find file ",File::Spec->catfile($dirname,$fname),": $!"; + # Add a new line if it not already there (note that the matching operator needs to use different delimiters, as we are still inside an outer scope that takes precedence + $replacement .= "\n" unless $replacement =~ m(\n$) ; + "$begline\\begin{$verbenv}$verboptions\n$replacement\\end{$verbenv}\n"; + }/exgm; + + return($text); +} + + +# print_regex_arr(@arr) +# prints regex array without x-ism expansion put in by pearl to stdout +sub print_regex_arr { + my $dumstring; + $dumstring = join(" ",@_); # PERL generates string (?-xism:^ref$) for quoted refex ^ref$ + $dumstring =~ s/\(\?-xism:\^(.*?)\$\)/$1/g; # remove string and ^,$ marks before output + print $dumstring,"\n"; +} + + +# @lines=extrapream($type,...) +# reads line from appendix or external file +# (end of file after __END__ token) +# if $type is a filename, it will read the file instead of reading from the appendix +# otherwise it will screen appendix for line "%DIF $TYPE" and copy everything up to line +# '%DIF END $TYPE' (where $TYPE is upcased version of $type) +# extrapream('-nofail',$type) will---instead of failing---simply return nothing if +# it does not find the matching line in a appendix (do not use -nofail option with multiple types!) +sub extrapream { + my @types=@_; + my ($type,$arg); + my $nofail=0; + ###my @retval=("%DIF PREAMBLE EXTENSION ADDED BY LATEXDIFF") ; + my @retval=(); + my ($copy); + + foreach $arg ( @types ) { + if ( $arg eq '-nofail' ) { + $nofail=1; + next; + } + $type=$arg; + $copy=0; + if ( -f $type || lc $type eq '/dev/null' ) { + open (FILE,$type) or die "Cannot open preamble file $type: $!"; + print STDERR "Reading preamble file $type\n" if $verbose ; + while () { + chomp ; + if ( $_ =~ m/%DIF PREAMBLE/ ) { + push (@retval,"$_"); + } else { + push (@retval,"$_ %DIF PREAMBLE"); + } + } + } else { # not (-f $type) + $type=uc($type); # upcase argument + print STDERR "Preamble Internal Type $type\n" if $verbose; + # save filehandle position (before first read this points to line after __END__) + # but seek DATA,0,0 resets it to the beginning of the file + # see https://stackoverflow.com/questions/4459601/how-can-i-use-data-twice + my $data_start = tell DATA; + while () { + if ( m/^%DIF $type/ ) { + $copy=1; + } elsif ( m/^%DIF END $type/ ) { + last; + } + chomp; + push (@retval,"$_ %DIF PREAMBLE") if $copy; + } + if ( $copy == 0 ) { + unless ($nofail) { + print STDERR "\nPreamble style $type not implemented.\n"; + print STDERR "Write latexdiff -h to get help with available styles\n"; + exit(2); + } + } + seek DATA,$data_start,0; # rewind DATA handle to beginning of data record + } + } + ###push (@retval,"%DIF END PREAMBLE EXTENSION ADDED BY LATEXDIFF") ; + return @retval; +} + + +# ($part1,$part2,$part3)=splitdoc($text,$word1,$word2) +# splits $text into 3 parts at $word1 and $word2. +# if neither $word1 nor $word2 exist, $part1 and $part3 are empty, $part2 is $text +# If only $word1 or $word2 exist but not the other, output an error message. + +# NB this version avoids $` and $' for performance reason although it only makes a tiny difference +# (in one test gain a tenth of a second for a 30s run) +sub splitdoc { + my ($text,$word1,$word2)=@_; + my ($part1,$part2,$part3)=("","",""); + my ($rest,$pos); + + if ( $text =~ m/(^[^%]*)($word1)/mg ) { + $pos=pos $text; + $part1=substr($text,0,$pos-length($2)); + $rest=substr($text,$pos); + if ( $rest =~ m/(^[^%]*)($word2)/mg ) { + $pos=pos $rest; + $part2=substr($rest,0,$pos-length($2)); + $part3=substr($rest,$pos); + } + else { + die "$word1 and $word2 not in the correct order or not present as a pair." ; + } + } else { + $part2=$text; + die "$word2 present but not $word1." if ( $text =~ m/(^[^%]*)$word2/ms ); + } + return ($part1,$part2,$part3); +} + + + + + +# bodydiff($old,$new) +sub bodydiff { + my ($oldwords, $newwords) = @_; + my @retwords; + + print STDERR "(",exetime()," s)\n","Splitting into latex tokens \n" if $verbose; + print STDERR "Parsing $oldfile \n" if $verbose; + my @oldwords = splitlatex($oldwords); + print STDERR "Parsing $newfile \n" if $verbose; + my @newwords = splitlatex($newwords); + + if ( $debug ) { + open(TOKENOLD,">","latexdiff.debug.tokenold"); + print TOKENOLD join("***\n",@oldwords); + close(TOKENOLD); + open(TOKENNEW,">","latexdiff.debug.tokennew"); + print TOKENNEW join("***\n",@newwords); + close(TOKENNEW); + } + + print STDERR "(",exetime()," s)\n","Pass 1: Expanding text commands and merging isolated identities with changed blocks " if $verbose; + pass1(\@oldwords, \@newwords); + + + print STDERR "(",exetime()," s)\n","Pass 2: inserting DIF tokens and mark up. " if $verbose; + if ( $debug ) { + open(TOKENOLD,">","latexdiff.debug.tokenold2"); + print TOKENOLD join("***\n",@oldwords); + close(TOKENOLD); + open(TOKENNEW,">","latexdiff.debug.tokennew2"); + print TOKENNEW join("***\n",@newwords); + close(TOKENNEW); + } + + @retwords=pass2(\@oldwords, \@newwords); + + return(@retwords); +} + + + + +# @words=splitlatex($string) +# split string according to latex rules +# Each element of words is either +# a word (including trailing spaces and punctuation) +# a latex command +# if there is white space in the beginning return that as first token +sub splitlatex { + my ($inputstring) = @_ ; + my $string=$inputstring ; + # if input is empty, return empty list + length($string)>0 or return (); + $string=~s/^(\s*)//s; + my $leadin=$1; + length($string)>0 or return ($leadin); + + my @retval=($string =~ m/$pat/osg); + + if (length($string) != length(join("",@retval))) { + print STDERR "\nWARNING: Inconsistency in length of input string and parsed string:\n This often indicates faulty or non-standard latex code.\n In many cases you can ignore this and the following warning messages.\n Note that character numbers in the following are counted beginning after \\begin{document} and are only approximate." unless $ignorewarnings; + print STDERR "DEBUG Original length ",length($string)," Parsed length ",length(join("",@retval)),"\n" if $debug; + print STDERR "DEBUG Input string: |$string|\n" if (length($string)<500) && $debug; + print STDERR "DEBUG Token parsing: |",join("+",@retval),"|\n" if (length($string)<500) && $debug ; + @retval=(); + # slow way only do this if other m//sg method fails + my $last = 0; + while ( $string =~ m/$pat/osg ) { + my $match=$&; + if ($last + length $& != pos $string ) { + my $pos=pos($string); + my $offset=30<$last ? 30 : $last; + my $dum=substr($string,$last-$offset,$pos-$last+2*$offset); + my $dum1=$dum; + my $cnt=$#retval; + my $i; + $dum1 =~ s/\n/ /g; + unless ($ignorewarnings) { + print STDERR "\n$dum1\n"; + print STDERR " " x 30,"^" x ($pos-$last)," " x 30,"\n"; + print STDERR "Missing characters near word " . (scalar @retval) . " character index: " . $last . "-" . pos($string) . " Length: " . length($match) . " Match: |$match| (expected match marked above).\n"; + } + # put in missing characters `by hand' + push (@retval, substr($dum,$offset,$pos-$last-length($match))); +# Note: there seems to be a bug in substr with utf8 that made the following line output substr which were too long, +# using dum instead appears to work +# push (@retval, substr($string,$last, pos($string)-$last-length($match))); + } + push (@retval, $match); + $last=pos $string; + } + + } + unshift(@retval,$leadin) if (length($leadin)>0); + return @retval; +} + + +# pass1( \@seq1,\@seq2) +# Look for differences between seq1 and seq2. +# Where an common-subsequence block is flanked by deleted or appended blocks, +# and is shorter than $MINWORDSBLOCK words it is appended +# to the last deleted or appended word. If the block contains tokens other than words +# or punctuation it is not merged. +# Deleted or appended block consisting of words and safe commands only are +# also merged, to prevent break-up in pass2 (after previous isolated words have been removed) +# If there are commands with textual arguments (e.g. \caption) both in corresponding +# appended and deleted blocks split them such that the command and opening bracket +# are one token, then the rest is split up following standard rules, and the closing +# bracket is a separate token, ie. turn +# "\caption{This is a textual argument}" into +# ("\caption{","This ","is ","a ","textual ","argument","}") +# No return value. Destructively changes sequences +sub pass1 { + my $seq1 = shift ; + my $seq2 = shift ; + + my $len1 = scalar @$seq1; + my $len2 = scalar @$seq2; + my $wpat=qr/^(?:[a-zA-Z.,'`:;?()!]*)[\s~]*$/; #' + + my ($last1,$last2)=(-1,-1) ; + my $cnt=0; + my $block=[]; + my $addblock=[]; + my $delblock=[]; + my $todo=[]; + my $instruction=[]; + my $i; + my (@delmid,@addmid,@dummy); + + my ($addcmds,$delcmds,$matchindex); + my ($addtextblocks,$deltextblocks); + my ($addtokcnt,$deltokcnt,$mattokcnt)=(0,0,0); + my ($addblkcnt,$delblkcnt,$matblkcnt)=(0,0,0); + + my $adddiscard = sub { + if ($cnt > 0 ) { + $matblkcnt++; + # just after an unchanged block +# print STDERR "Unchanged block $cnt, $last1,$last2 \n"; + if ($cnt < $MINWORDSBLOCK + && $cnt==scalar ( + grep { /^$wpat/ || ( /^\\((?:[`'^"~=.]|[\w\d@*]+))((?:\[$brat_n\]|\{$pat_n\})*)/o + && iscmd($1,\@SAFECMDLIST,\@SAFECMDEXCL) + && scalar(@dummy=split(" ",$2))<3 ) } + @$block) ) { + # merge identical blocks shorter than $MINWORDSBLOCK + # and only containing ordinary words + # with preceding different word + # We cannot carry out this merging immediately as this + # would change the index numbers of seq1 and seq2 and confuse + # the algorithm, instead we store in @$todo where we have to merge + push(@$todo, [ $last1,$last2,$cnt,@$block ]); + } + $block = []; + $cnt=0; $last1=-1; $last2=-1; + } + }; + my $discard=sub { $deltokcnt++; + &$adddiscard; #($_[0],$_[1]); + push(@$delblock,[ $seq1->[$_[0]],$_[0] ]); + $last1=$_[0] }; + + my $add = sub { $addtokcnt++; + &$adddiscard; #($_[0],$_[1]); + push(@$addblock,[ $seq2->[$_[1]],$_[1] ]); + $last2=$_[1] }; + + my $match = sub { $mattokcnt++; + if ($cnt==0) { # first word of matching sequence after changed sequence or at beginning of word sequence + $deltextblocks = extracttextblocks($delblock); + $delblkcnt++ if scalar @$delblock; + $addtextblocks = extracttextblocks($addblock); + $addblkcnt++ if scalar @$addblock; + + # make a list of all TEXTCMDLIST commands in deleted and added blocks + $delcmds = extractcommands($delblock); + $addcmds = extractcommands($addblock); + # now find those text commands, which are found in both deleted and added blocks, and expand them + # keygen(third argument of _longestCommonSubsequence) implies to sort on command (0th elements of $addcmd elements) + # the calling format for longestCommonSubsequence has changed between versions of + # Algorithm::Diff so we need to check which one we are using + if ( $algodiffversion > 1.15 ) { + ### Algorithm::Diff 1.19 + $matchindex=Algorithm::Diff::_longestCommonSubsequence($delcmds,$addcmds, 0, sub { $_[0]->[0] } ); + } else { + ### Algorithm::Diff 1.15 + $matchindex=Algorithm::Diff::_longestCommonSubsequence($delcmds,$addcmds, sub { $_[0]->[0] } ); + } + + for ($i=0 ; $i<=$#$matchindex ; $i++) { + if (defined($matchindex->[$i])){ + $j=$matchindex->[$i]; + @delmid=splitlatex($delcmds->[$i][3]); + @addmid=splitlatex($addcmds->[$j][3]); + while (scalar(@$deltextblocks) && $deltextblocks->[0][0]<$delcmds->[$i][1]) { + my ($index,$block,$cnt)=@{ shift(@$deltextblocks) }; + push(@$todo, [$index,-1,$cnt,@$block]); + } + push(@$todo, [ $delcmds->[$i][1],-1,-1,$delcmds->[$i][2],@delmid,$delcmds->[$i][4]]); + + while (scalar(@$addtextblocks) && $addtextblocks->[0][0]<$addcmds->[$j][1]) { + my ($index,$block,$cnt)=@{ shift(@$addtextblocks) }; + push(@$todo, [-1,$index,$cnt,@$block]); + } + push(@$todo, [ -1,$addcmds->[$j][1],-1,$addcmds->[$j][2],@addmid,$addcmds->[$j][4]]); + } + } + # mop up remaining textblocks + while (scalar(@$deltextblocks)) { + my ($index,$block,$cnt)=@{ shift(@$deltextblocks) } ; + push(@$todo, [$index,-1,$cnt,@$block]); + } + while (scalar(@$addtextblocks)) { + my ($index,$block,$cnt)=@{ shift(@$addtextblocks) }; + push(@$todo, [-1,$index,$cnt,@$block]); + } + + $addblock=[]; + $delblock=[]; + } + push(@$block,$seq2->[$_[1]]); + $cnt++ }; + + my $keyfunc = sub { join(" ",split(" ",shift())) }; + + traverse_sequences($seq1,$seq2, { MATCH=>$match, DISCARD_A=>$discard, DISCARD_B=>$add }, $keyfunc ); + + + # now carry out the merging/splitting. Refer to elements relative from + # the end (with negative indices) as these offsets don't change before the instruction is executed + # cnt>0: merged small unchanged groups with previous changed blocks + # cnt==-1: split textual commands into components + foreach $instruction ( @$todo) { + ($last1,$last2,$cnt,@$block)=@$instruction ; + if ($cnt>=0) { + splice(@$seq1,$last1-$len1,1+$cnt,join("",$seq1->[$last1-$len1],@$block)) if $last1>=0; + splice(@$seq2,$last2-$len2,1+$cnt,join("",$seq2->[$last2-$len2],@$block)) if $last2>=0; + } else { + splice(@$seq1,$last1-$len1,1,@$block) if $last1>=0; + splice(@$seq2,$last2-$len2,1,@$block) if $last2>=0; + } + } + + if ($verbose) { + print STDERR "\n"; + print STDERR " $mattokcnt matching tokens in $matblkcnt blocks.\n"; + print STDERR " $deltokcnt discarded tokens in $delblkcnt blocks.\n"; + print STDERR " $addtokcnt appended tokens in $addblkcnt blocks.\n"; + } +} + + +# extracttextblocks(\@blockindex) +# $blockindex has the following format +# [ [ token1, index1 ], [token2, index2],.. ] +# where index refers to the index in the original old or new word sequence +# Returns: reference to an array of the form +# [[ $index, $textblock, $cnt ], .. +# where $index index of block to be merged +# $textblock contains all the words to be merged with the word at $index (but does not contain this word) +# $cnt is length of block +# +# requires: iscmd +# +sub extracttextblocks { + my $block=shift; + my ($i,$token,$index); + my $textblock=[]; + my $last=-1; + my $wpat=qr/^(?:[a-zA-Z.,'`:;?()!]*)[\s~]*$/; #' + my $retval=[]; + + for ($i=0;$i< scalar @$block;$i++) { + ($token,$index)=@{ $block->[$i] }; + # store pure text blocks + if ($token =~ /$wpat/ || ( $token =~/^\\((?:[`'^"~=.]|[\w\d@\*]+))((?:${extraspace}\[$brat_n\]${extraspace}|${extraspace}\{$pat_n\})*)/o + && iscmd($1,\@SAFECMDLIST,\@SAFECMDEXCL) + && !iscmd($1,\@TEXTCMDLIST,\@TEXTCMDEXCL))) { + # we have text or a command which can be treated as text + if ($last<0) { + # new pure-text block + $last=$index; + } else { + # add to pure-text block + push(@$textblock, $token); + } + } else { + # it is not text + if (scalar(@$textblock)) { + push(@$retval,[ $last, $textblock, scalar(@$textblock) ]); + } + $textblock=[]; + $last=-1; + } + } + # finish processing a possibly unfinished block before returning + if (scalar(@$textblock)) { + push(@$retval,[ $last, $textblock, scalar(@$textblock) ]); + } + return($retval) +} + + + +# extractcommands( \@blockindex ) +# $blockindex has the following format +# [ [ token1, index1 ], [token2, index2],.. ] +# where index refers to the index in the original old or new word sequence +# Returns: reference to an array of the form +# [ [ "\cmd1", index, "\cmd1[optarg]{arg1}{", "arg2" ,"} " ],.. +# where index is just taken from input array +# command must have a textual argument as last argument +# +# requires: iscmd +# +sub extractcommands { + my $block=shift; + my ($i,$token,$index,$cmd,$open,$mid,$closing); + my $retval=[]; + + for ($i=0;$i< scalar @$block;$i++) { + ($token,$index)=@{ $block->[$i] }; + # check if token is an alphanumeric command sequence with at least one non-optional argument + # \cmd[...]{...}{last argument} + # Capturing in the following results in these associations + # $1: \cmd[...]{...}{ + # $2: \cmd + # $3: last argument + # $4: } + trailing spaces + if ( ( $token =~ m/^(\\([\w\d\*]+)(?:${extraspace}\[$brat_n\]|${extraspace}\{$pat_n\})*${extraspace}\{)($pat_n)(\}\s*)$/so ) + && iscmd($2,\@TEXTCMDLIST,\@TEXTCMDEXCL) ) { + # push(@$retval,[ $2,$index,$1,$3,$4 ]); + ($cmd,$open,$mid,$closing) = ($2,$1,$3,$4) ; + $closing =~ s/\}/\\RIGHTBRACE/ ; + push(@$retval,[ $cmd,$index,$open,$mid,$closing ]); + } + } + return $retval; +} + +# iscmd($cmd,\@regexarray,\@regexexcl) checks +# return 1 if $cmd matches any of the patterns in the +# array $@regexarray, and none of the patterns in \@regexexcl, otherwise return 0 +sub iscmd { + my ($cmd,$regexar,$regexexcl)=@_; + my ($ret)=0; + foreach $pat ( @$regexar ) { + if ( $cmd =~ m/^${pat}$/ ) { + $ret=1 ; + last; + } + } + return 0 unless $ret; + foreach $pat ( @$regexexcl ) { + return 0 if ( $cmd =~ m/^${pat}$/ ); + } + return 1; +} + + +# pass2( \@seq1,\@seq2) +# Look for differences between seq1 and seq2. +# Mark begin and end of deleted and appended sequences with tags $DELOPEN and $DELCLOSE +# and $ADDOPEN and $ADDCLOSE, respectively, however exclude { } & and all comands, unless +# they match an element of the whitelist (SAFECMD) +# For words in TEXTCMD but not in SAFECMD, enclose interior with $ADDOPEN and $ADDCLOSE brackets +# Deleted comment lines are marked with %DIF < +# Added comment lines are marked with %DIF > +sub pass2 { + my $seq1 = shift ; + my $seq2 = shift ; + + my ($addtokcnt,$deltokcnt,$mattokcnt)=(0,0,0); + my ($addblkcnt,$delblkcnt,$matblkcnt)=(0,0,0); + + my $retval = []; + my $delhunk = []; + my $addhunk = []; + + my $discard = sub { $deltokcnt++; + push ( @$delhunk, $seq1->[$_[0]]) }; + + my $add = sub { $addtokcnt++; + push ( @$addhunk, $seq2->[$_[1]]) }; + + my $match = sub { $mattokcnt++; + if ( scalar @$delhunk ) { + $delblkcnt++; + # mark up changes, but comment out commands + push @$retval,marktags($DELMARKOPEN,$DELMARKCLOSE,$DELOPEN,$DELCLOSE,$DELCMDOPEN,$DELCMDCLOSE,$DELCOMMENT,$delhunk); + $delhunk = []; + } + if ( scalar @$addhunk ) { + $addblkcnt++; + # we mark up changes, but simply quote commands + push @$retval,marktags($ADDMARKOPEN,$ADDMARKCLOSE,$ADDOPEN,$ADDCLOSE,"","",$ADDCOMMENT,$addhunk); + $addhunk = []; + } + push(@$retval,$seq2->[$_[1]]) }; + + my $keyfunc = sub { join(" ",split(" ",shift())) }; + + traverse_sequences($seq1,$seq2, { MATCH=>$match, DISCARD_A=>$discard, DISCARD_B=>$add }, $keyfunc ); + # clear up unprocessed hunks + push @$retval,marktags($DELMARKOPEN,$DELMARKCLOSE,$DELOPEN,$DELCLOSE,$DELCMDOPEN,$DELCMDCLOSE,$DELCOMMENT,$delhunk) if scalar @$delhunk; + push @$retval,marktags($ADDMARKOPEN,$ADDMARKCLOSE,$ADDOPEN,$ADDCLOSE,"","",$ADDCOMMENT,$addhunk) if scalar @$addhunk; + + + if ($verbose) { + print STDERR "\n"; + print STDERR " $mattokcnt matching tokens. \n"; + print STDERR " $deltokcnt discarded tokens in $delblkcnt blocks.\n"; + print STDERR " $addtokcnt appended tokens in $addblkcnt blocks.\n"; + } + + return(@$retval); +} + +# marktags($openmark,$closemark,$open,$close,$opencmd,$closecmd,$comment,\@block) +# returns ($openmark,$open,$block,$close,$closemark) if @block contains no commands (except white-listed ones), +# braces, ampersands, or comments +# mark comments with $comment +# exclude all other exceptions from scope of open, close like this +# ($openmark, $open,...,$close, $opencmd,command, command,$closecmd, $open, ..., $close, $closemark) +# If $opencmd begins with "%" marktags assumes it is operating on a deleted block, otherwise on an added block +sub marktags { + my ($openmark,$closemark,$open,$close,$opencmd,$closecmd,$comment,$block)=@_; + my $word; + my (@argtext); + my $retval=[]; + my $noncomment=0; + my $cmd=-1; # -1 at beginning 0: last token written is a ordinary word + # 1: last token written is a command + # for keeping track whether we are just in a command sequence or in a word sequence + my $cmdcomment= ($opencmd =~ m/^%/); # Flag to indicate whether opencmd is a comment (i.e. if we intend to simply comment out changed commands) + my ($command,$commandword,$closingbracket) ; # temporary variables needed below to remember sub-pattern matches + +# split this block to flatten out sequences joined in pass1 + @$block=splitlatex(join "",@$block); + ### print STDERR "DEBUG: marktags $openmark,$closemark,$open,$close,$opencmd,$closecmd,$comment\n" if $debug; + ### print STDERR "DEBUG: marktags blocksplit ",join("|",@$block),"\n" if $debug; + foreach (@$block) { + $word=$_; + ### print STDERR "DEBUG MARKTAGS: |$word|\n" if $debug; + if ( $word =~ s/^%/%$comment/ ) { + # a comment + if ($cmd==1) { + push (@$retval,$closecmd) ; + $cmd=-1; + } + push (@$retval,$word); + next; + } + if ( $word =~ m/^\s*$/ ) { + ### print STDERR "DEBUG MARKTAGS: whitespace detected |$word| cmdcom |$cmdcomment| |$opencmd|\n" if $debug; + # a sequence of white-space characters - this should only ever happen for the first element of block. + # in deleted block, omit, otherwise just copy it in + if ( ! $cmdcomment) { # ignore in deleted blocks + push(@$retval,$word); + } + next; + } + if (! $noncomment) { + push (@$retval,$openmark); + $noncomment=1; + } + # negative lookahead pattern (?!) in second clause is put in to avoid matching \( .. \) patterns + # also note that second pattern will match \\ + ### print STDERR "DEBUG marktags: Considering word |$word|\n"; + if ( $word =~ /^[&{}\[\]]/ || ( $word =~ /^\\(?!\()(\\|[`'^"~=.]|[\w*@]+)/ && !iscmd($1,\@SAFECMDLIST,\@SAFECMDEXCL)) ) { + ###print STDERR "DEBUG MARKTAGS is a non-safe command ($1)\n" if $debug; + ### if ( $word =~ /^[&{}\[\]]/ || ( $word =~ /^\\([\w*@\\% ]+)/ && !iscmd($1,\@SAFECMDLIST,\@SAFECMDEXCL)) ) { + # word is a command or other significant token (not in SAFECMDLIST) + ## same conditions as in subroutine extractcommand: + # check if token is an alphanumeric command sequence with at least one non-optional argument + # \cmd[...]{...}{last argument} + # Capturing in the following results in these associations + # $1: \cmd[...]{...}{ + # $2: cmd + # $3: last argument + # $4: } + trailing spaces + ### pre-0.3 if ( ( $token =~ m/^(\\([\w\d\*]+)(?:\[$brat0\]|\{$pat_n\})*\{)($pat_n)(\}\s*)$/so ) + if ( ( $word =~ m/^(\\([\w\d\*]+)(?:${extraspace}\[$brat_n\]|${extraspace}\{$pat_n\})*${extraspace}\{)($pat_n)(\}\s*)$/so ) + && (iscmd($2,\@TEXTCMDLIST,\@TEXTCMDEXCL)|| iscmd($2,\@MATHTEXTCMDLIST,\@MATHTEXTCMDEXCL)) + && ( !$cmdcomment || !iscmd($2,\@CONTEXT2CMDLIST, \@CONTEXT2CMDEXCL) ) ) { + # Condition 1: word is a command? - if yes, $1,$2,.. will be set as above + # Condition 2: word is a text command - we mark up the interior of the word. There is a separate check for MATHTEXTCMDLIST + # because for $mathmarkup=WHOLE, the commands should not be split in pass1 (ie. math mode commands are not in + # TEXTCMDLIST, but the interior of MATHTEXT commands should be highlighted in both deleted and added blocks + # Condition 3: But if we are in a deleted block ($cmdcomment=1) and + # $2 (the command) is in context2, just treat it as an ordinary command (i.e. comment it open with $opencmd) + # Because we do not want to disable this command + # here we do not use $opencmd and $closecmd($opencmd is empty) + if ($cmd==1) { + push (@$retval,$closecmd) ; + } elsif ($cmd==0) { + push (@$retval,$close) ; + } + $command=$1; $commandword=$2; $closingbracket=$4; + @argtext=splitlatex($3); # split textual argument into tokens + # and mark it up (but we do not need openmark and closemark) + # insert command with initial arguments, marked-up final argument, and closing bracket + if ( $cmdcomment && iscmd($commandword,\@CONTEXT1CMDLIST, \@CONTEXT1CMDEXCL) ) { + # context1cmd in a deleted environment; delete command itself but keep last argument, marked up + push (@$retval,$opencmd); + $command =~ s/\n/\n${opencmd}/sg ; # repeat opencmd at the beginning of each line + # argument, note that the additional comment character is included + # to suppress linebreak after opening parentheses, which is important + # for latexrevise + push (@$retval,$command,"%\n{$AUXCMD\n",marktags("","",$open,$close,$opencmd,$closecmd,$comment,\@argtext),$closingbracket); + } elsif ( iscmd($commandword,,\@MATHTEXTCMDLIST, \@MATHTEXTCMDEXCL) ) { + # MATHBLOCK pseudo command: consider all commands safe, except & and \\ + # Keep these commands even in deleted blocks, hence set $opencmd and $closecmd (5th and 6th argument of marktags) to + # "" + local @SAFECMDLIST=(".*"); + local @SAFECMDEXCL=('\\','\\\\',@UNSAFEMATHCMD); + push(@$retval,$command,marktags("","",$open,$close,"","",$comment,\@argtext)#@argtext + ,$closingbracket); + } else { + # normal textcmd or context1cmd in an added block + push (@$retval,$command,marktags("","",$open,$close,$opencmd,$closecmd,$comment,\@argtext),$closingbracket); + } + push (@$retval,$AUXCMD,"\n") if $cmdcomment ; + $cmd=-1 ; + } else { + # ordinary command + push (@$retval,$opencmd) if $cmd==-1 ; + push (@$retval,$close,$opencmd) if $cmd==0 ; + $word =~ s/\n/\n${opencmd}/sg if $cmdcomment ; # if opencmd is a comment, repeat this at the beginning of every line + ### print STDERR "MARKTAGS: Add command |$word|\n"; + push (@$retval,$word); + $cmd=1; + } + } else { + ###print STDERR "DEBUG MARKTAGS is an ordinary word or SAFECMD command \n" if $debug; + # just an ordinary word or command in SAFECMD + push (@$retval,$open) if $cmd==-1 ; + push (@$retval,$closecmd,$open) if $cmd==1 ; + ###TODO: check here if it is a command in MBOXCMD list, and surround it with \mbox{...} + ### $word =~ /^\\(?!\()(\\|[`'^"~=.]|[\w*@]+)/ && iscmd($1,\@MBOXCMDLIST,\@MBOXCMDEXCL)) + ### but actually this check has been carried out already so can simply check if word begins with backslash + if ( $word =~ /^\\(?!\()(\\|[`'^"~=.]|[\w*@]+)(.*?)(\s*)$/s && iscmd($1,\@MBOXCMDLIST,\@MBOXCMDEXCL)) { + # $word is a safe command in MBOXCMDLIST + ###print STDERR "DEBUG Mboxsafecmd detected:$word:\n" if $debug ; + push(@$retval,"\\mbox{$AUXCMD\n\\" . $1 . $2 . $3 ."}\\hspace{0pt}$AUXCMD\n" ); + } else { + # $word is a normal word or a safe command (not in MBOXCMDLIST) + push (@$retval,$word); + } + $cmd=0; + } + } + push (@$retval,$close) if $cmd==0; + push (@$retval,$closecmd) if $cmd==1; + + push (@$retval,$closemark) if ($noncomment); + return @$retval; +} + +#used in preprocess +sub take_comments_and_enter_from_frac() { + #*************take the \n and % between frac and {}*********** + #notice all of the substitution are made none global + while( m/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)}(.*?)\\frac(([\s]*%[^\n]*?)*[\r\n|\r|\n])+\{(.*?)\\end\{\1}/s ) { + # if there isn't any % or \n in the pattern $2 then there should be an \\end{...} in $2 + ### print STDERR "Match the following in take_comments and_enter_from_frac(1):\n****$&****\n" if $debug; + if( $2 !~ m/\\end\{$1}/s ) { + # take out % and \n from the next match only (none global) + s/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)}(.*?)\\frac(([\s]*%[^\n]*?)*[\r\n|\r|\n])+\{(.*?)\\end\{\1}/\\begin{$1}$2\\frac{$5\\end{$1}/s; + } + else{ + #there are no more % and \n in $2, we want to find the next one so we clear the begin-end from the pattern + s/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)}(.*?)\\end\{\1}/MATHBLOCK$1\{$2\}MATHBLOCKEND/s; + } + } + ###cleaning up + while( s/MATHBLOCK($MATHENV|$MATHARRENV|SQUAREBRACKET)\{(.*?)\}MATHBLOCKEND/\\begin{$1}$2\\end{$1}/s ){} + ###*************take the \n and % between frac and {}*********** + + ###**********take the \n and % between {} and {} of the frac*************** + while( m/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)\}(.*?)\\frac\{(.*?)\\end\{\1\}/s ) { + # if there isn't any more //frac before the first //end in the pattern $2 then there should be an \\end{...} in $2 + ###print STDERR "Match the following in take_comments and_enter_from_frac(2):\n****$&****\n" if $debug; + if( $2 !~ m/\\end\{$1\}/s ) { + # from now on CURRFRAC is the frac we are looking at + s/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)\}(.*?)\\frac\{(.*?)\\end\{\1\}/\\begin\{$1\}$2CURRFRAC\{$3\\end\{$1\}/s; + while( m/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)\}(.*?)CURRFRAC\{(.*?)\\end\{\1\}/s ) { + if( m/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)\}(.*?)CURRFRAC\{($pat_n)\}([\s]*(%[^\n]*?)*[\r\n|\r|\n])+[\s]*\{(.*?)\\end\{\1}/s ) { + s/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)\}(.*?)CURRFRAC\{($pat_n)\}([\s]*(%[^\n]*?)*[\r\n|\r|\n])+[\s]*\{(.*?)\\end\{\1\}/\\begin\{$1\}$2CURRFRAC\{$3\}\{$6\\end\{$1\}/s; + } + else { # there is no comment or \n between the two brackets {}{} + # change CURRFRAC to FRACSTART so we can change them all back to //frac{ when we finish + s/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)}(.*?)CURRFRAC\{(.*?)\\end\{\1}/\\begin{$1}$2FRACSTART\{$3\\end{$1}/s; + } + } + } + else{ + ###there are no more frac in $2, we want to find the next one so we clear the begin-end from the pattern + s/\\begin\{($MATHENV|$MATHARRENV|SQUAREBRACKET)}(.*?)\\end\{\1}/MATHBLOCK$1\{$2\}MATHBLOCKEND/s; + } + + } + ###cleaning up + while( s/MATHBLOCK($MATHENV|$MATHARRENV|SQUAREBRACKET)\{(.*?)\}MATHBLOCKEND/\\begin{$1}$2\\end{$1}/s ){} + s/FRACSTART/\\frac/g; + ###***************take the \n and % between {} and {} of the frac********************* +} + +# preprocess($string, ..) +# carry out the following pre-processing steps for all arguments: +# 1. Remove leading white-space +# Change \{ to \QLEFTBRACE and \} to \QRIGHTBRACE and \& to \AMPERSAND +# #. Change {,} in comments to \CLEFTBRACE, \CRIGHTBRACE +# 2. mark all first empty line (in block of several) with \PAR tokens +# 3. Convert all '\%' into '\PERCENTAGE ' and all '\$' into \DOLLAR to make parsing regular expressions easier +# 4. Convert all \verb|some verbatim text| commands (where | can be an arbitrary character) +# into \verb{hash} (also lstinline) +# 5. Convert \begin{verbatim} some verbatim text \end{verbatim} into \verbatim{hash} (not only verbatim, all patterns matching VERBATIMENV) +# 6. Convert _n into \SUBSCRIPTNB{n} and _{nnn} into \SUBSCRIPT{nn} +# 7. Convert ^n into \SUPERSCRIPTNB{n} and ^{nnn} into \SUPERSCRIPT{nn} +# 8. a. Convert $$ $$ into \begin{DOLLARDOLLAR} \end{DOLLARDOLLAR} +# b. Convert \[ \] into \begin{SQUAREBRACKET} \end{SQUAREBRACKET} +# 9. Convert all picture environmentent (\begin{PICTUREENV} .. \end{PICTUREENV} \PICTUREBLOCKenv +# For math-mode COARSE,WHOLE or NONE option -convert all \begin{MATH} .. \end{MATH} +# into \MATHBLOCKmath{...} commands, where MATH/math is any valid math environment + +# 10. Add final token STOP to the very end. This is put in because the algorithm works better if the last token is identical. This is removed again in postprocessing. +# +# NB: step 6 and 7 is likely to convert some "_" inappropriately, e.g. in file +# names or labels but it does not matter because they are converted back in the postprocessing step +# Returns: leading white space removed in step 1 +sub preprocess { + for (@_) { + + + # change in \verb and similar commands - note that I introduce an extra space here so that the + # already hashed variants do not trigger again + # transform \lstinline{...} +# s/\\lstinline(\[$brat0\])?(\{(?:.*?)\})/"\\DIFlstinline". $1 ."{". tohash(\%verbhash,"$2") ."}"/esg; +# s/\\lstinline(\[$brat0\])?((\S).*?\2)/"\\DIFlstinline". $1 ."{". tohash(\%verbhash,"$2") ."}"/esg; + + # Mark inline-verb in commented lines to be COMMENTverb (no hashing, no marking with color) + 1 while s/((?{$hstr}) && $string ne $hash->{$hstr}); + # else found a duplicate HASH need to repeat for a higher hash value + } + $hash->{$hstr}=$string; + ### print STDERR "Hash:$hstr: Content:$string:\n"; + return($hstr); +} + +#string=fromhash(\%hash,$fromstring) +# restores string value stored in hash +#string=fromhash(\%hash,$fromstring,$prependstring) +# additionally begins each line with prependstring +sub fromhash { + my ($hash,$hstr)=($_[0],$_[1]); + my $retstr=$hash->{$hstr}; + if ( $#_ >= 2) { + $retstr =~ s/^/$_[2]/mg; + } + return $retstr; +} + + +# postprocess($string, ..) +# carry out the following post-processing steps for all arguments: +# * Remove STOP token from the end +# * Replace \RIGHTBRACE by } +# * change citation commands within comments to protect from processing (using marker CITEDIF) +# 1. Check all deleted blocks: +# a.where a deleted block contains a matching \begin and +# \end environment (these will be disabled by a %DIFDELCMD statements), for selected environments enable +# these commands again (such that for example displayed math in a deleted equation +# is properly within math mode. For math mode environments replace numbered equation +# environments with their display only variety (so that equation numbers in new file and +# diff file are identical). Where the correct type of math environment cannot be determined +# use a place holder MATHMODE +# b.where one of the commands matching $COUNTERCMD is used as a DIFAUXCMD, add a statement +# subtracting one from the respective counter to keep numbering consistent with new file +# Replace all MATHMODE environment commands by the correct environment to achieve matching +# pairs +# c. Convert MATHBLOCKmath commands to their uncounted numbers (e.g. convert equation -> displaymath +# (environments defined in $MATHENV will be replaced by $MATHREPL, and environments in $MATHARRENV +# will be replaced by $MATHARRREPL +# d. If in-line math mode contains array environment, enclose the whole environment in \mbox'es +# d. place \cite commands in mbox'es (for UNDERLINE style) +# +# For added blocks: +# c. If in-line math mode contains array environment, enclose the whole environment in \mbox'es +# d. place \cite commands in mbox'es (for UNDERLINE style) +# +# 2. If math-mode COARSE,WHOLE or NONE option set: Convert \MATHBLOCKmath{..} commands back to environments +# +# Convert all PICTUREblock{..} commands back to the appropriate environments +# 3. Convert DIFadd, DIFdel, DIFaddbegin , ... into FL varieties +# within floats (currently recognised float environments: plate,table,figure +# plus starred varieties). +# 4. Remove empty %DIFDELCMD < lines +# 4. Convert \begin{SQUAREBRACKET} \end{SQUAREBRACKET} into \[ \] +# Convert \begin{DOLLARDOLLAR} \end{DOLLARDOLLAR} into $$ $$ +# 5. Convert \SUPERSCRIPTNB{n} into ^n and \SUPERSCRIPT{nn} into ^{nnn} +# 6. Convert \SUBSCRIPTNB{n} into _n and \SUBCRIPT{nn} into _{nnn} +# 7. Expand hashes of verb and verbatim environments +# 8. Convert '\PERCENTAGE ' back into '\%' and '\DOLLAR ' into '\$' +# 9.. remove all \PAR tokens +# 10. package specific processing: endfloat: make sure \begin{figure} and \end{figure} are always +# on a line by themselves, similarly for table environment +# 4, undo renaming of the \begin, \end,{,} in comments +# Change \QLEFTBRACE, \QRIGHTBRACE,\AMPERSAND to \{,\},\& +# +# Note have to manually synchronize substitution commands below and +# DIF.. command names in the header +sub postprocess { + my ($begin,$len,$cnt,$float,$delblock,$addblock); + # second level blocks + my ($begin2,$cnt2,$len2,$eqarrayblock,$mathblock); + + my (@textparts,@newtextparts,@liststack,$listtype,$listlast); + + for (@_) { + + # change $'s in comments to something harmless + 1 while s/(%.*)\$/$1DOLLARDIF/mg ; + + # Remove final STOP token + s/ STOP$//; + # Replace \RIGHTBRACE in comments by \MBLOCKRIGHTBRACE + # the only way to get these is as %DIFDELCMD < \RIGHTBRACE construction + # This essentially marks closing right braces of MATHBLOCK environments, which did not get matched + # up. This case should be rare, so I just leave this in the diff file output. Not really elegant + # but can still be dealt with later if it results in problems. + s/%DIFDELCMD < \\RIGHTBRACE/%DIFDELCMD < \\MBLOCKRIGHTBRACE/g ; + # Replace \RIGHTBRACE by } + s/\\RIGHTBRACE/}/g; + + # Check all deleted blocks: where a deleted block contains a matching \begin and + # \end environment (these will be disabled by a %DIFDELCMD statements), enable + # these commands again (such that for example displayed math in a deleted equation + # is properly within math mode). For math mode environments replace numbered equation + # environments with their display only variety (so that equation numbers in new file and + # diff file are identical) + while ( m/\\DIFdelbegin.*?\\DIFdelend/sg ) { + $cnt=0; + $len=length($&); + $begin=pos($_) - $len; + $delblock=$&; + + + ### (.*?[^\n]?)\n? construct is necessary to avoid empty lines in math mode, which result in + ### an error + # displayed math environments + if ($mathmarkup == FINE ) { + $delblock=~ s/(\%DIFDELCMD < \s*\\begin\{((?:$MATHENV)|SQUAREBRACKET)\}.*?(?:$DELCMDCLOSE|\n))(.*?[^\n]?)\n?(\%DIFDELCMD < \s*\\end\{\2\})/\\begin{$MATHREPL}$AUXCMD\n$1$3\n\\end{$MATHREPL}$AUXCMD\n$4/sg; + # also transform the opposite pair \end{displaymath} .. \begin{displaymath} but we have to be careful not to interfere with the results of the transformation in the line directly above + ### pre-0.42 obsolete version which did not work on eqnarray test $delblock=~ s/(? displaymath +# (environments defined in $MATHENV will be replaced by $MATHREPL, and environments in $MATHARRENV +# will be replaced by $MATHARRREPL + $delblock=~ s/\\MATHBLOCK($MATHENV)\{($pat_n)\}/\\MATHBLOCK$MATHREPL\{$2\}/sg; + $delblock=~ s/\\MATHBLOCK($MATHARRENV)\{($pat_n)\}/\\MATHBLOCK$MATHARRREPL\{$2\}/sg; + } + # Reinstate completely deleted list environments. note that items within the + # environment will still be commented out. They will be restored later + $delblock=~ s/(\%DIFDELCMD < \s*\\begin\{($LISTENV)\}\s*?(?:\n|$DELCMDCLOSE))(.*?)(\%DIFDELCMD < \s*\\end\{\2\})/{ + ### # block within the search; replacement environment + ### "$1\\begin{$2}$AUXCMD\n". restore_item_commands($3). "\n\\end{$2}$AUXCMD\n$4"; + "$1\\begin{$2}$AUXCMD\n$3\n\\end{$2}$AUXCMD\n$4"; + }/esg; + + +# b.where one of the commands matching $COUNTERCMD is used as a DIFAUXCMD, add a statement +# subtracting one from the respective counter to keep numbering consistent with new file + $delblock=~ s/\\($COUNTERCMD)((?:${extraspace}\[$brat_n\]${extraspace}|${extraspace}\{$pat_n\})*\s*${AUXCMD}\n)/\\$1$2\\addtocounter{$1}{-1}${AUXCMD}\n/sg ; + +# bb. disable active labels within deleted blocks (as these are not safe commands, this should normally only +# happen within deleted maths blocks + $delblock=~ s/(?>>\n" if $debug; + + + # make the array modification in added blocks + while ( m/\\DIFaddbegin.*?\\DIFaddend/sg ) { + $cnt=0; + $len=length($&); + $begin=pos($_) - $len; + $addblock=$&; + while ( $addblock =~ m/($math)(\s*)/sg ) { + $cnt2=0; + $len2=length($&); + $begin2=pos($addblock) - $len2; + $mathblock="%\n\\mbox{$AUXCMD\n$1\n}$AUXCMD\n"; + next unless ( $mathblock =~ /ARRAYBLOCK/ or $mathblock =~ m/\{$ARRENV\}/) ; + substr($addblock,$begin2,$len2)=$mathblock; + pos($addblock) = $begin2 + length($mathblock); + } + # if MBOXINLINEMATH is set, protect inlined math environments with an extra mbox + if ( $MBOXINLINEMATH ) { + ##$addblock=~s/($math)/\\mbox{$AUXCMD\n$1\n}$AUXCMD\n/sg; + $addblock=~s/($math)(?:[\s\n]*)?/\\mbox{$AUXCMD\n$1\n}$AUXCMD\n/sg; + } + ###if ( defined($packages{"listings"} and $latexdiffpreamble =~ /\\RequirePackage(?:\[$brat0\])?\{color\}/)) { + # mark added verbatim commands + $addblock =~ s/\\DIFverb/\\DIFDIFaddverb/g; + $addblock =~ s/\\DIF($LSTINLINEENV)/\\DIFDIFadd$1/g; + if( $CUSTOMDIFCMD ) { + $addblock =~ s/\\($CUSTOMDIFCMD)/\\ADD$1/g; + } + ###} +# splice in modified addblock + substr($_,$begin,$len)=$addblock; + pos = $begin + length($addblock); + } + + # Go through whole text, and by counting list environment commands, find out when we are within a list environment. + # Within those restore deleted \item commands + @textparts=split /(? 0) { + $listlast=pop(@liststack); + ($listtype eq $listlast) or warn "Invalid nesting of list environments: $listlast environment closed by \\end{$listtype}."; + } else { + warn "WARNING: Invalid nesting of list environments: \\end{$listtype} encountered without matching \\begin{$listtype}.\n"; + } + } else { + print STDERR "DEBUG: postprocess \@liststack=(",join(",",@liststack),")\n" if $debug; + if (scalar @liststack > 0 ) { + # we are within a list environment and should replace all item commands + $_=restore_item_commands($_); + } + # else: we are outside a list environment and do not need to do anything + } + $_ } @textparts; # end of map command + # replace the main text with the modified version + $_= join("",@newtextparts); + + + + + # Replace MATHMODE environments from step 1a above by the correct Math environment + + # The next line is complicated. The negative look-ahead insertion makes sure that no \end{$MATHENV} (or other mathematical + # environments) are between the \begin{$MATHENV} and \end{MATHMODE} commands. This is necessary as the minimal matching + # is not globally minimal but only 'locally' (matching is beginning from the left side of the string) + if ( $mathmarkup == FINE ) { + 1 while s/\\begin\{((?:$MATHENV)|(?:$MATHARRENV)|SQUAREBRACKET)}((?:.(?!(?:\\end\{(?:(?:$MATHENV)|(?:$MATHARRENV)|SQUAREBRACKET)}|\\begin\{MATHMODE})))*?)\\end\{MATHMODE}/\\begin{$1}$2\\end{$1}/s; + 1 while s/\\begin\{MATHMODE}((?:.(?!\\end\{MATHMODE}))*?)\\end\{((?:$MATHENV)|(?:$MATHARRENV)|SQUAREBRACKET)}/\\begin{$2}$1\\end{$2}/s; + # convert remaining \begin{MATHMODE} \end{MATHMODE} (and not containing & or \\ )into MATHREPL environments + s/\\begin\{MATHMODE\}((?:(.(?!(? )([^\n]*?\n)/"${1}" . escape_command(${2}, "(?:plc|textnormal|textsubscript|textsl)", "@\\DIFadd{", "}@")/esg; + s/}\\glossarydef(start|end)/}\n\\glossarydef\1\n/g; + s/\\\\\s+\\DIFaddend\s+\\end\{supertabular\}/\\DIFaddend \\\\\n\\end{supertabular}/gm; + + return; + } +} + +sub escape_special { + my ($text) = @_; + $text =~ s/\\/\\\\ /g; + return $text; +} + +sub escape_command { + my ($text, $command, $prefix, $suffix) = @_; + $text =~ s/(\\$command)(\{$pat_n\})/"${prefix}${1}". escape_special(${2}) ."${suffix}"/esg; + return $text; +} + +# $out = restore_item_commands($listenviron) +# short helper function for post-process, which restores deleted \item commands in its argument (as DIFAUXCMDs) +sub restore_item_commands { + my ($string)=@_ ; + my ($itemarg,@itemargs); + $string =~ s/(\%DIFDELCMD < \s*(\\$ITEMCMD)((?:<$abrat0>)?)((?:\[$brat_n\])?)\s*((?:${cmdoptseq}\s*?)*)(?:\n|$DELCMDCLOSE))/ + # if \item has an []argument, then mark up the argument as deleted) + if (length($4)>0) { + # use substr to exclude square brackets at end points + @itemargs=splitlatex(substr($4,1,length($4)-2)); + $itemarg="[".join("",marktags("","",$DELOPEN,$DELCLOSE,$DELCMDOPEN,$DELCMDCLOSE,$DELCOMMENT,\@itemargs))."]"; + } else { + $itemarg=""; + } + "$1$2$3$itemarg$AUXCMD\n"; ###.((length($5)>0) ? "%DIFDELCMD $5 $DELCMDCLOSE\n" : "") + /sge; + return($string); +} + + +# @auxlines=preprocess_preamble($oldpreamble,$newpreamble); + # pre-process preamble by looking for commands used in \maketitle (title, author, date etc commands) + # the list of commands is defined in CONTEXT2CMD + # if found then use a bodydiff to mark up content, and replace the corresponding commands + # in both preambles by marked up version to 'fool' the linediff (such that only body is marked + # up. + # A special case are e.g. author commands being added (or removed) + # 1. If commands are added, then the entire content is marked up as new, but also the lines are marked as new in the linediff + # 2. If commands are removed, then the linediff will mark the line as deleted. The program returns + # with $auxlines a text to be appended at the end of the preamble, which shows the respective fields as deleted +sub preprocess_preamble { + my ($oldpreambleref,$newpreambleref)=(\$_[0],\$_[1]) ; + my @auxlines=(); + # Remember to use $$oldpreambleref to refer to oldpreamble + my ($titlecmd,$titlecmdpat); + my (@oldtitlecommands,@newtitlecommands ); + my %oldhash = (); + my %newhash = (); + my ($line,$cmd,$optarg,$arg,$optargnew,$optargold,$optargdiff,$argold,$argnew,$argdiff,$auxline); + + my $warnmsgdetail = <[1])) { + $optargnew=$newhash{$cmd}->[1]; + } else { + $optargnew=""; + } + if ( defined($oldhash{$cmd}->[1])) { + $optargold=$oldhash{$cmd}->[1]; + } else { + $optargold=""; + } + + if ( defined($oldhash{$cmd}->[2]) ) { + $argold=$oldhash{$cmd}->[2]; + } else { + $argold=""; + } + $argnew=$newhash{$cmd}->[2]; + $argdiff="{" . join("",bodydiff($argold,$argnew)) ."}"; + if ( length $optargnew ) { + $optargdiff="[".join("",bodydiff($optargold,$optargnew))."]" ; + $optargdiff =~ s/\\DIFaddbegin /\\DIFaddbeginFL /g; + $optargdiff =~ s/\\DIFaddend /\\DIFaddendFL /g; + $optargdiff =~ s/\\DIFadd\{/\\DIFaddFL{/g; + $optargdiff =~ s/\\DIFdelbegin /\\DIFdelbeginFL /g; + $optargdiff =~ s/\\DIFdelend /\\DIFdelendFL /g; + $optargdiff =~ s/\\DIFdel\{/\\DIFdelFL{/g; + } else { + $optargdiff=""; + } + ### print STDERR "DEBUG s/\\Q$newhash{$cmd}->[0]\\E/\\$cmd$optargdiff$argdiff/s\n"; + # Note: \Q and \E force literal interpretation of what it between them but allow + # variable interpolation, such that e.g. \title matches just that and not TAB-itle + $$newpreambleref=~s/\Q$newhash{$cmd}->[0]\E/\\$cmd$optargdiff$argdiff/s; + # replace this in old preamble if necessary + if ( defined($oldhash{$cmd}->[0])) { + $$oldpreambleref=~s/\Q$oldhash{$cmd}->[0]\E/\\$cmd$optargdiff$argdiff/s ; + } + ### print STDERR "DEBUG NEW PRE ".$$newpreambleref."\n"; + } + + foreach $cmd ( keys %oldhash ) { + # if this has already been dealt with above can just skip + next if defined($newhash{$cmd}) ; + $argold=$oldhash{$cmd}->[2]; + $argdiff="{" . join("",bodydiff($argold,"")) ."}"; + if ( defined($oldhash{$cmd}->[1])) { + $optargold=$oldhash{$cmd}->[1]; + $optargdiff="[".join("",bodydiff($optargold,""))."]" ; + $optargdiff =~ s/\\DIFdelbegin /\\DIFdelbeginFL /g; + $optargdiff =~ s/\\DIFdelend /\\DIFdelendFL /g; + $optargdiff =~ s/\\DIFdel\{/\\DIFdelFL{/g; + } else { + $optargdiff=""; + } + $auxline = "\\$cmd$optargdiff$argdiff"; + $auxline =~s/$/$AUXCMD/sg; + push @auxlines,$auxline; + } + # add auxcmd comment to highlight added lines + return(@auxlines); +} + + + +# @diffs=linediff(\@seq1, \@seq2) +# mark up lines like this +#%DIF mm-mmdnn +#%< old deleted line(s) +#%DIF ------- +#%DIF mmann-nn +#new appended line %< +#%DIF ------- +# Future extension: mark change explicitly +# Assumes: traverse_sequence traverses deletions before insertions in changed sequences +# all line numbers relative to line 0 (first line of real file) +sub linediff { + my $seq1 = shift ; + my $seq2 = shift ; + + my $block = []; + my $retseq = []; + my @begin=('','',''); # dummy initialisation + my $instring ; + + my $discard = sub { @begin=('d',$_[0],$_[1]) unless scalar @$block ; + push(@$block, "%DIF < " . $seq1->[$_[0]]) }; + my $add = sub { if (! scalar @$block) { + @begin=('a',$_[0],$_[1]) ;} + elsif ( $begin[0] eq 'd' ) { + $begin[0]='c'; $begin[2]=$_[1]; + push(@$block, "%DIF -------") } + push(@$block, $seq2->[$_[1]] . " %DIF > " ) }; + my $match = sub { if ( scalar @$block ) { + if ( $begin[0] eq 'd' && $begin[1]!=$_[0]-1) { + $instring = sprintf "%%DIF %d-%dd%d",$begin[1],$_[0]-1,$begin[2]; } + elsif ( $begin[0] eq 'a' && $begin[2]!=$_[1]-1) { + $instring = sprintf "%%DIF %da%d-%d",$begin[1],$begin[2],$_[1]-1; } + elsif ( $begin[0] eq 'c' ) { + $instring = sprintf "%%DIF %sc%s", + ($begin[1]==$_[0]-1) ? "$begin[1]" : $begin[1]."-".($_[0]-1) , + ($begin[2]==$_[1]-1) ? "$begin[2]" : $begin[2]."-".($_[1]-1) ; } + else { + $instring = sprintf "%%DIF %d%s%d",$begin[1],$begin[0],$begin[2]; } + push @$retseq, $instring,@$block, "%DIF -------" ; + $block = []; + } + push @$retseq, $seq2->[$_[1]] + }; + # key function: remove multiple spaces (such that insertion or deletion of redundant white space is not reported) + my $keyfunc = sub { join(" ",split(" ",shift())) }; + + traverse_sequences($seq1,$seq2, { MATCH=>$match, DISCARD_A=>$discard, DISCARD_B=>$add }, $keyfunc ); + push @$retseq, @$block if scalar @$block; + + return wantarray ? @$retseq : $retseq ; +} + + + +# init_regex_arr_data(\@array,"TOKEN INIT") +# scans DATA file handel for line "%% TOKEN INIT" line +# then appends each line not beginning with % into array (as a quoted regex) +# This is used for command lists and configuration variables, but the processing is slightly +# different: +# For lists, the regular expression is extended to include beginning (^) and end ($) markers, to require full-string matching +# For configuration variables (and all others), simply an unadorned list is copied +sub init_regex_arr_data { + my ($arr,$token)=@_; + my $copy=0; + my ($mode); + if ($token =~ m/COMMANDS/ ) { + $mode=0; + } else { + $mode=1; + } + + while () { + if ( m/^%%BEGIN $token\s*$/ ) { + $copy=1; + next; + } elsif ( m/^%%END $token\s*$/ ) { + last; } + chomp; + if ( $mode==0 ) { + push (@$arr,qr/^$_$/) if ( $copy && !/^%/ ) ; + } elsif ($mode==1) { + push (@$arr,"$_") if ( $copy && !/^%/ ) ; + } + } + seek DATA,0,0; # rewind DATA handle to file begin +} + + +# init_regex_arr_ext(\@array,$arg) +# appends array with regular expressions. +# if arg is a file name, then read in list of regular expressions from that file +# (one expression per line) +# Otherwise treat arg as a comma separated list of regular expressions +sub init_regex_arr_ext { + my ($arr,$arg)=@_; + if ( -f $arg ) { + init_regex_arr_file($arr,$arg); + } else { + init_regex_arr_list($arr,$arg); + } +} + +# init_regex_arr_file(\@array,$fname) +# appends array with regular expressions. +# Read in list of regular expressions from $fname +# (one expression per line) +sub init_regex_arr_file { + my ($arr,$fname)=@_; + open(FILE,"$fname") or die ("Couldn't open $fname: $!"); + while () { + chomp; + next if /^\s*#/ || /^\s*%/ || /^\s*$/ ; + push (@$arr,qr/^$_$/); + } + close(FILE); +} + +# init_regex_arr_list(\@array,$arg) +# appends array with regular expressions. +# read from comma separated list of regular expressions ($arg) +sub init_regex_arr_list { + my ($arr,$arg)=@_; + my $regex; + ### print STDERR "DEBUG init_regex_arr_list arg >$arg<\n" if $debug; + foreach $regex (split(qr/(?=1) { + $reset=shift; + } + if ($reset) { + $lasttime=times(); + } + else { + $retval=times()-$lasttime; + $lasttime=$lasttime+$retval; + return($retval); + } +} + + +sub usage { + die <<"EOF"; +Usage: $0 [options] old.tex new.tex > diff.tex + +Compares two latex files and writes tex code to stdout, which has the same format as new.tex but +has all changes relative to old.tex marked up or commented. Note that old.tex and new.tex need to +be real files (not pipes or similar) as they are opened twice. + +--type=markupstyle +-t markupstyle Add code to preamble for selected markup style + Available styles: UNDERLINE CTRADITIONAL TRADITIONAL CFONT FONTSTRIKE INVISIBLE + CHANGEBAR CCHANGEBAR CULINECHBAR CFONTCBHBAR BOLD PDFCOMMENT + [ Default: UNDERLINE ] + +--subtype=markstyle +-s markstyle Add code to preamble for selected style for bracketing + commands (e.g. to mark changes in margin) + Available styles: SAFE MARGIN DVIPSCOL COLOR ZLABEL ONLYCHANGEDPAGE (LABEL)* + [ Default: SAFE ] + * LABEL subtype is deprecated + +--floattype=markstyle +-f markstyle Add code to preamble for selected style which + replace standard marking and markup commands within floats + (e.g., marginal remarks cause an error within floats + so marginal marking can be disabled thus) + Available styles: FLOATSAFE IDENTICAL + [ Default: FLOATSAFE ] + +--encoding=enc +-e enc Specify encoding of old.tex and new.tex. Typical encodings are + ascii, utf8, latin1, latin9. A list of available encodings can be + obtained by executing + perl -MEncode -e 'print join ("\\n",Encode->encodings( ":all" )) ;' + [Default encoding is utf8 unless the first few lines of the preamble contain + an invocation "\\usepackage[..]{inputenc} in which case the + encoding chosen by this command is asssumed. Note that ASCII (standard + latex) is a subset of utf8] + +--preamble=file +-p file Insert file at end of preamble instead of auto-generating + preamble. The preamble must define the following commands + \\DIFaddbegin,\\DIFaddend,\\DIFadd{..}, + \\DIFdelbegin,\\DIFdelend,\\DIFdel{..}, + and varieties for use within floats + \\DIFaddbeginFL,\\DIFaddendFL,\\DIFaddFL{..}, + \\DIFdelbeginFL,\\DIFdelendFL,\\DIFdelFL{..} + (If this option is set -t, -s, and -f options + are ignored.) + +--exclude-safecmd=exclude-file +--exclude-safecmd="cmd1,cmd2,..." +-A exclude-file +--replace-safecmd=replace-file +--append-safecmd=append-file +--append-safecmd="cmd1,cmd2,..." +-a append-file Exclude from, replace or append to the list of regex + matching commands which are safe to use within the + scope of a \\DIFadd or \\DIFdel command. The file must contain + one Perl-RegEx per line (Comment lines beginning with # or % are + ignored). A literal comma within the comma-separated list must be + escaped thus "\\,", Note that the RegEx needs to match the whole of + the token, i.e., /^regex\$/ is implied and that the initial + "\\" of the command is not included. The --exclude-safecmd + and --append-safecmd options can be combined with the --replace-safecmd + option and can be used repeatedly to add cumulatively to the lists. + +--exclude-textcmd=exclude-file +--exclude-textcmd="cmd1,cmd2,..." +-X exclude-file +--replace-textcmd=replace-file +--append-textcmd=append-file +--append-textcmd="cmd1,cmd2,..." +-x append-file Exclude from, replace or append to the list of regex + matching commands whose last argument is text. See + entry for --exclude-safecmd directly above for further details. + +--replace-context1cmd=replace-file +--append-context1cmd=append-file +--append-context1cmd="cmd1,cmd2,..." + Replace or append to the list of regex matching commands + whose last argument is text but which require a particular + context to work, e.g. \\caption will only work within a figure + or table. These commands behave like text commands, except when + they occur in a deleted section, when they are disabled, but their + argument is shown as deleted text. + +--replace-context2cmd=replace-file +--append-context2cmd=append-file +--append-context2cmd="cmd1,cmd2,..." + As corresponding commands for context1. The only difference is that + context2 commands are completely disabled in deleted sections, including + their arguments. + context2 commands are also the only commands in the preamble, whose argument will + be processed in word-by-word mode (which only works, if they occur no more than + once in the preamble). + +--exclude-mboxsafecmd=exclude-file +--exclude-mboxsafecmd="cmd1,cmd2,..." +--append-mboxsafecmd=append-file +--append-mboxsafecmd="cmd1,cmd2,..." + Define safe commands, which additionally need to be protected by encapsulating + in an \\mbox{..}. This is sometimes needed to get around incompatibilities + between external packages and the ulem package, which is used for highlighting + in the default style UNDERLINE as well as CULINECHBAR CFONTSTRIKE + + + +--config var1=val1,var2=val2,... +-c var1=val1,.. Set configuration variables. +-c configfile Available variables: + ARRENV (RegEx) + COUNTERCMD (RegEx) + FLOATENV (RegEx) + ITEMCMD (RegEx) + LISTENV (RegEx) + MATHARRENV (RegEx) + MATHARRREPL (String) + MATHENV (RegEx) + MATHREPL (String) + MINWORDSBLOCK (Integer) + PICTUREENV (RegEx) + SCALEDELGRAPHICS (Float) + VERBATIMENV (RegEx) + VERBATIMLINEENV (RegEx) + LSTINLINEENV (RegEx) + CUSTOMDIFCMD (RegEx) + This option can be repeated. + +--add-to-config varenv1=pattern1,varenv2=pattern2 + For configuration variables containing a regular expression (essentially those ending + in ENV, and COUNTERCMD) this provides an alternative way to modify the configuration + variables. Instead of setting the complete pattern, with this option it is possible to add an + alternative pattern. varenv must be one of the variables listed above that take a regular + expression as argument, and pattern is any regular expression (which might need to be + protected from the shell by quotation). Several patterns can be added at once by using semi-colons + to separate them, e.g. --add-to-config "LISTENV=myitemize;myenumerate,COUNTERCMD=endnote" + +--packages=pkg1,pkg2,.. + Tell latexdiff that .tex file is processed with the packages in list + loaded. This is normally not necessary if the .tex file includes the + preamble, as the preamble is automatically scanned for \\usepackage commands. + Use of the --packages option disables automatic scanning, so if for any + reason package specific parsing needs to be switched off, use --packages=none. + The following packages trigger special behaviour: + endfloat hyperref amsmath apacite siunitx cleveref glossaries mhchem chemformula/chemmacros + [ Default: scan the preamble for \\usepackage commands to determine + loaded packages.] + +--show-preamble Print generated or included preamble commands to stdout. + +--show-safecmd Print list of regex matching and excluding safe commands. + +--show-textcmd Print list of regex matching and excluding commands with text argument. + +--show-config Show values of configuration variables + +--show-all Show all of the above + + NB For all --show commands, no old.tex or new.tex file needs to be given, and no + differencing takes place. + +Other configuration options: + +--allow-spaces Allow spaces between bracketed or braced arguments to commands + [Default requires arguments to directly follow each other without + intervening spaces] + +--math-markup=level Determine granularity of markup in displayed math environments: + Possible values for level are (both numerical and text labels are acceptable): + off or 0: suppress markup for math environments. Deleted equations will not + appear in diff file. This mode can be used if all the other modes + cause invalid latex code. + whole or 1: Differencing on the level of whole equations. Even trivial changes + to equations cause the whole equation to be marked changed. This + mode can be used if processing in coarse or fine mode results in + invalid latex code. + coarse or 2: Detect changes within equations marked up with a coarse + granularity; changes in equation type (e.g.displaymath to equation) + appear as a change to the complete equation. This mode is recommended + for situations where the content and order of some equations are still + being changed. [Default] + fine or 3: Detect small change in equations and mark up and fine granularity. + This mode is most suitable, if only minor changes to equations are + expected, e.g. correction of typos. + +--graphics-markup=level Change highlight style for graphics embedded with \\includegraphics commands + Possible values for level: + none,off or 0: no highlighting for figures + new-only or 1: surround newly added or changed figures with a blue frame [Default] + both or 2: highlight new figures with a blue frame and show deleted figures + at reduced scale, and crossed out with a red diagonal cross. Use configuration + variable SCALEDELGRAPHICS to set size of deleted figures. + Note that changes to the optional parameters will make the figure appear as changed + to latexdiff, and this figure will thus be highlighted. + +--disable-citation-markup +--disable-auto-mbox Suppress citation markup and markup of other vulnerable commands in styles + using ulem (UNDERLINE,FONTSTRIKE, CULINECHBAR) + (the two options are identical and are simply aliases) + +--enable-citation-markup +--enforce-auto-mbox Protect citation commands and other vulnerable commands in changed sections + with \\mbox command, i.e. use default behaviour for ulem package for other packages + (the two options are identical and are simply aliases) + +Miscelleneous options + +--label=label +-L label Sets the labels used to describe the old and new files. The first use + of this option sets the label describing the old file and the second + use of the option sets the label for the new file. + [Default: use the filename and modification dates for the label] + +--no-label Suppress inclusion of old and new file names as comment in output file + +--no-links Suppress generation of hyperrefs, used for minimal diffs + +--visible-label Include old and new filenames (or labels set with --label option) as + visible output + +--flatten Replace \\input and \\include commands within body by the content + of the files in their argument. If \\includeonly is present in the + preamble, only those files are expanded into the document. However, + no recursion is done, i.e. \\input and \\include commands within + included sections are not expanded. The included files are assumed to + be located in the same directories as the old and new master files, + respectively, making it possible to organise files into old and new directories. + --flatten is applied recursively, so inputted files can contain further + \\input statements. + +--help +-h Show this help text. + +--ignore-warnings Suppress warnings about inconsistencies in length between input + and parsed strings and missing characters. + +--verbose +-V Output various status information to stderr during processing. + Default is to work silently. + +--version Show version number. + +EOF +} + +=head1 NAME + +latexdiff - determine and markup differences between two latex files + +=head1 SYNOPSIS + +B [ B ] F F > F + +=head1 DESCRIPTION + +Briefly, I is a utility program to aid in the management of +revisions of latex documents. It compares two valid latex files, here +called C and C, finds significant differences +between them (i.e., ignoring the number of white spaces and position +of line breaks), and adds special commands to highlight the +differences. Where visual highlighting is not possible, e.g. for changes +in the formatting, the differences are +nevertheless marked up in the source. Note that old.tex and new.tex need to +be real files (not pipes or similar) as they are opened twice (unless C<--encoding> option is used) + +The program treats the preamble differently from the main document. +Differences between the preambles are found using line-based +differencing (similarly to the Unix diff command, but ignoring white +spaces). A comment, "S>>" is appended to each added line, i.e. a +line present in C but not in C. Discarded lines + are deactivated by prepending "S>>". Changed blocks are preceded by +comment lines giving information about line numbers in the original files. Where there are insignificant +differences, the resulting file C will be similar to +C. At the end of the preamble, the definitions for I markup commands are inserted. +In differencing the main body of the text, I attempts to +satisfy the following guidelines (in order of priority): + +=over 3 + +=item 1 + +If both C and C are valid LaTeX, then the resulting +C should also be valid LateX. (NB If a few plain TeX commands +are used within C or C then C is not +guaranteed to work but usually will). + +=item 2 + +Significant differences are determined on the level of +individual words. All significant differences, including differences +between comments should be clearly marked in the resulting source code +C. + +=item 3 + +If a changed passage contains text or text-producing commands, then +running C through LateX should produce output where added +and discarded passages are highlighted. + +=item 4 + +Where there are insignificant differences, e.g. in the positioning of +line breaks, C should follow the formatting of C + +=back + +For differencing the same algorithm as I is used but words +instead of lines are compared. An attempt is made to recognize +blocks which are completely changed such that they can be marked up as a unit. +Comments are differenced line by line +but the number of spaces within comments is ignored. Commands including +all their arguments are generally compared as one unit, i.e., no mark-up +is inserted into the arguments of commands. However, for a selected +number of commands (for example, C<\caption> and all sectioning +commands) the last argument is known to be text. This text is +split into words and differenced just as ordinary text (use options to +show and change the list of text commands, see below). As the +algorithm has no detailed knowledge of LaTeX, it assumes all pairs of +curly braces immediately following a command (i.e. a sequence of +letters beginning with a backslash) are arguments for that command. +As a restriction to condition 1 above it is thus necessary to surround +all arguments with curly braces, and to not insert +extraneous spaces. For example, write + + \section{\textem{This is an emphasized section title}} + +and not + + \section {\textem{This is an emphasized section title}} + +or + + \section\textem{This is an emphasized section title} + +even though all varieties are the same to LaTeX (but see +B<--allow-spaces> option which allows the second variety). + +For environments whose content does not conform to standard LaTeX or +where graphical markup does not make sense all markup commands can be +removed by setting the PICTUREENV configuration variable, set by +default to C and C environments; see B<--config> +option). The latter environment (C) can be used to +protect parts of the latex file where the markup results in illegal +markup. You have to surround the offending passage in both the old and +new file by C<\begin{DIFnomarkup}> and C<\end{DIFnomarkup}>. You must +define the environment in the preambles of both old and new +documents. I prefer to define it as a null-environment, + +C<\newenvironment{DIFnomarkup}{}{}> + +but the choice is yours. Any markup within the environment will be +removed, and generally everything within the environment will just be +taken from the new file. + +It is also possible to difference files which do not have a preamble. + In this case, the file is processed in the main document +mode, but the definitions of the markup commands are not inserted. + +All markup commands inserted by I begin with "C<\DIF>". Added +blocks containing words, commands or comments which are in C +but not in C are marked by C<\DIFaddbegin> and C<\DIFaddend>. +Discarded blocks are marked by C<\DIFdelbegin> and C<\DIFdelend>. +Within added blocks all text is highlighted with C<\DIFadd> like this: +C<\DIFadd{Added text block}> +Selected `safe' commands can be contained in these text blocks as well +(use options to show and change the list of safe commands, see below). +All other commands as well as braces "{" and "}" are never put within +the scope of C<\DIFadd>. Added comments are marked by prepending +"S >>". + +Within deleted blocks text is highlighted with C<\DIFdel>. Deleted +comments are marked by prepending "S >>". Non-safe command +and curly braces within deleted blocks are commented out with +"S >>". + + + +=head1 OPTIONS + +=head2 Preamble + +The following options determine the visual markup style by adding the appropriate +command definitions to the preamble. See the end of this section for a description of +available styles. + +=over 4 + +=item B<--type=markupstyle> or +B<-t markupstyle> + +Add code to preamble for selected markup style. This option defines +C<\DIFadd> and C<\DIFdel> commands. +Available styles: + +C + +[ Default: C ] + +=item B<--subtype=markstyle> or +B<-s markstyle> + +Add code to preamble for selected style for bracketing +commands (e.g. to mark changes in margin). This option defines +C<\DIFaddbegin>, C<\DIFaddend>, C<\DIFdelbegin> and C<\DIFdelend> commands. +Available styles: C + +[ Default: C ] +* Subtype C