From 542c10d074306f79a699aa3548518f9cc286a75a Mon Sep 17 00:00:00 2001 From: Richard Friedman Date: Tue, 13 Jan 2015 11:38:24 -0800 Subject: [PATCH] Initial add of all files --- Changes.log | 80 ++++ Examples_Chapt.tex | 9 + Examples_affinity.tex | 243 +++++++++++ Examples_array_sections.tex | 35 ++ Examples_associate.tex | 32 ++ Examples_async_target.tex | 31 ++ Examples_atomic.tex | 44 ++ Examples_atomic_restrict.tex | 25 ++ Examples_barrier_regions.tex | 24 ++ Examples_cancellation.tex | 42 ++ Examples_carrays_fpriv.tex | 37 ++ Examples_collapse.tex | 77 ++++ Examples_cond_comp.tex | 21 + Examples_copyin.tex | 13 + Examples_copyprivate.tex | 51 +++ Examples_critical.tex | 16 + Examples_declare_target.tex | 111 +++++ Examples_default_none.tex | 12 + Examples_device.tex | 35 ++ Examples_flush_nolist.tex | 12 + Examples_fort_do.tex | 19 + Examples_fort_loopvar.tex | 22 + Examples_fort_race.tex | 16 + Examples_fort_sa_private.tex | 23 + Examples_fort_sp_common.tex | 38 ++ Examples_fpriv_sections.tex | 18 + Examples_get_nthrs.tex | 21 + Examples_icv.tex | 56 +++ Examples_init_lock.tex | 11 + Examples_lastprivate.tex | 14 + Examples_lock_owner.tex | 23 + Examples_master.tex | 13 + Examples_mem_model.tex | 38 ++ Examples_nestable_lock.tex | 11 + Examples_nested_loop.tex | 18 + Examples_nesting_restrict.tex | 52 +++ Examples_nowait.tex | 28 ++ Examples_nthrs_dynamic.tex | 30 ++ Examples_nthrs_nesting.tex | 12 + Examples_ordered.tex | 28 ++ Examples_parallel.tex | 12 + Examples_ploop.tex | 11 + Examples_pra_iterator.tex | 11 + Examples_private.tex | 31 ++ Examples_psections.tex | 13 + Examples_reduction.tex | 60 +++ Examples_set_dynamic_nthrs.tex | 24 ++ Examples_simple_lock.tex | 19 + Examples_single.tex | 18 + Examples_standalone.tex | 31 ++ Examples_target.tex | 96 +++++ Examples_target_data.tex | 175 ++++++++ Examples_target_update.tex | 53 +++ Examples_taskgroup.tex | 20 + Examples_tasking.tex | 258 ++++++++++++ Examples_taskyield.tex | 14 + Examples_teams.tex | 118 ++++++ Examples_threadprivate.tex | 106 +++++ Examples_workshare.tex | 76 ++++ Examples_worksharing_critical.tex | 18 + Introduction_Chapt.tex | 69 +++ Makefile | 88 ++++ README | 3 + Title_Page.tex | 42 ++ figs/proc_bind_fig.pdf | Bin 0 -> 22804 bytes figs/proc_bind_fig.png | Bin 0 -> 12942 bytes openmp-examples.tex | 137 ++++++ openmp-logo.png | Bin 0 -> 3300 bytes openmp.sty | 484 ++++++++++++++++++++++ sources/Example_affinity.1c.c | 15 + sources/Example_affinity.1f.f | 10 + sources/Example_affinity.2c.c | 15 + sources/Example_affinity.2f.f | 10 + sources/Example_affinity.3c.c | 15 + sources/Example_affinity.3f.f | 10 + sources/Example_affinity.4c.c | 15 + sources/Example_affinity.4f.f | 10 + sources/Example_affinity.5c.c | 15 + sources/Example_affinity.5f.f | 10 + sources/Example_array_sections.1c.c | 19 + sources/Example_array_sections.1f.f | 15 + sources/Example_array_sections.2c.c | 23 + sources/Example_array_sections.2f.f | 20 + sources/Example_array_sections.3c.c | 20 + sources/Example_array_sections.3f.f | 16 + sources/Example_array_sections.4c.c | 21 + sources/Example_array_sections.4f.f | 17 + sources/Example_associate.1f.f | 13 + sources/Example_associate.2f.f | 15 + sources/Example_associate.3f.f | 16 + sources/Example_async_target.1c.c | 28 ++ sources/Example_async_target.1f.f | 38 ++ sources/Example_async_target.2c.c | 39 ++ sources/Example_async_target.2f.f | 39 ++ sources/Example_atomic.1c.c | 45 ++ sources/Example_atomic.1f.f | 49 +++ sources/Example_atomic.2c.c | 27 ++ sources/Example_atomic.2f.f | 24 ++ sources/Example_atomic.3c.c | 44 ++ sources/Example_atomic.3f.f | 50 +++ sources/Example_atomic_restrict.1c.c | 23 + sources/Example_atomic_restrict.1f.f | 19 + sources/Example_atomic_restrict.2c.c | 29 ++ sources/Example_atomic_restrict.2f.f | 24 ++ sources/Example_atomic_restrict.3f.f | 25 ++ sources/Example_barrier_regions.1c.c | 40 ++ sources/Example_barrier_regions.1f.f | 40 ++ sources/Example_cancellation.1c.c | 38 ++ sources/Example_cancellation.1f.f | 29 ++ sources/Example_cancellation.2c.c | 53 +++ sources/Example_cancellation.2f.f | 71 ++++ sources/Example_carrays_fpriv.1c.c | 38 ++ sources/Example_collapse.1c.c | 18 + sources/Example_collapse.1f.f | 20 + sources/Example_collapse.2c.c | 24 ++ sources/Example_collapse.2f.f | 20 + sources/Example_collapse.3c.c | 26 ++ sources/Example_collapse.3f.f | 20 + sources/Example_cond_comp.1c.c | 18 + sources/Example_cond_comp.1f.f | 11 + sources/Example_copyin.1c.c | 31 ++ sources/Example_copyin.1f.f | 28 ++ sources/Example_copyprivate.1c.c | 17 + sources/Example_copyprivate.1f.f | 15 + sources/Example_copyprivate.2c.c | 36 ++ sources/Example_copyprivate.2f.f | 24 ++ sources/Example_copyprivate.3c.c | 23 + sources/Example_copyprivate.3f.f | 14 + sources/Example_copyprivate.4f.f | 25 ++ sources/Example_critical.1c.c | 26 ++ sources/Example_critical.1f.f | 25 ++ sources/Example_declare_target.1c.c | 18 + sources/Example_declare_target.1f.f | 23 + sources/Example_declare_target.2c.c | 28 ++ sources/Example_declare_target.2f.f | 18 + sources/Example_declare_target.3c.c | 25 ++ sources/Example_declare_target.3f.f | 24 ++ sources/Example_declare_target.4c.c | 23 + sources/Example_declare_target.4f.f | 29 ++ sources/Example_declare_target.5c.c | 33 ++ sources/Example_declare_target.5f.f | 35 ++ sources/Example_default_none.1c.c | 34 ++ sources/Example_default_none.1f.f | 37 ++ sources/Example_device.1c.c | 43 ++ sources/Example_device.1f.f | 38 ++ sources/Example_device.2c.c | 22 + sources/Example_device.2f.f | 21 + sources/Example_device.3c.c | 17 + sources/Example_device.3f.f | 15 + sources/Example_flush_nolist.1c.c | 58 +++ sources/Example_flush_nolist.1f.f | 68 +++ sources/Example_fort_do.1f.f | 31 ++ sources/Example_fort_do.2f.f | 19 + sources/Example_fort_loopvar.1f.f | 19 + sources/Example_fort_loopvar.2f.f | 27 ++ sources/Example_fort_race.1f.f | 29 ++ sources/Example_fort_sa_private.1f.f | 18 + sources/Example_fort_sa_private.2f.f | 24 ++ sources/Example_fort_sa_private.3f.f | 15 + sources/Example_fort_sa_private.4f.f | 31 ++ sources/Example_fort_sa_private.5f.f | 41 ++ sources/Example_fort_sp_common.1f.f | 16 + sources/Example_fort_sp_common.2f.f | 22 + sources/Example_fort_sp_common.3f.f | 14 + sources/Example_fort_sp_common.4f.f | 12 + sources/Example_fort_sp_common.5f.f | 14 + sources/Example_fpriv_sections.1c.c | 32 ++ sources/Example_fpriv_sections.1f.f | 24 ++ sources/Example_get_nthrs.1c.c | 20 + sources/Example_get_nthrs.1f.f | 21 + sources/Example_get_nthrs.2c.c | 20 + sources/Example_get_nthrs.2f.f | 22 + sources/Example_icv.1c.c | 50 +++ sources/Example_icv.1f.f | 38 ++ sources/Example_init_lock.1c.c | 21 + sources/Example_init_lock.1f.f | 18 + sources/Example_lastprivate.1c.c | 20 + sources/Example_lastprivate.1f.f | 21 + sources/Example_lock_owner.1c.c | 33 ++ sources/Example_lock_owner.1f.f | 25 ++ sources/Example_master.1c.c | 42 ++ sources/Example_master.1f.f | 36 ++ sources/Example_mem_model.1c.c | 36 ++ sources/Example_mem_model.1f.f | 32 ++ sources/Example_mem_model.2c.c | 48 +++ sources/Example_mem_model.2f.f | 38 ++ sources/Example_mem_model.3c.c | 50 +++ sources/Example_mem_model.3f.f | 40 ++ sources/Example_nestable_lock.1c.c | 46 ++ sources/Example_nestable_lock.1f.f | 63 +++ sources/Example_nested_loop.1c.c | 25 ++ sources/Example_nested_loop.1f.f | 25 ++ sources/Example_nested_loop.2c.c | 32 ++ sources/Example_nested_loop.2f.f | 28 ++ sources/Example_nesting_restrict.1c.c | 22 + sources/Example_nesting_restrict.1f.f | 21 + sources/Example_nesting_restrict.2c.c | 27 ++ sources/Example_nesting_restrict.2f.f | 23 + sources/Example_nesting_restrict.3c.c | 21 + sources/Example_nesting_restrict.3f.f | 18 + sources/Example_nesting_restrict.4c.c | 23 + sources/Example_nesting_restrict.4f.f | 19 + sources/Example_nesting_restrict.5c.c | 21 + sources/Example_nesting_restrict.5f.f | 17 + sources/Example_nesting_restrict.6c.c | 21 + sources/Example_nesting_restrict.6f.f | 17 + sources/Example_nowait.1c.c | 23 + sources/Example_nowait.1f.f | 29 ++ sources/Example_nowait.2c.c | 26 ++ sources/Example_nowait.2f.f | 27 ++ sources/Example_nthrs_dynamic.1c.c | 17 + sources/Example_nthrs_dynamic.1f.f | 12 + sources/Example_nthrs_dynamic.2c.c | 17 + sources/Example_nthrs_dynamic.2f.f | 12 + sources/Example_nthrs_nesting.1c.c | 58 +++ sources/Example_nthrs_nesting.1f.f | 40 ++ sources/Example_ordered.1c.c | 29 ++ sources/Example_ordered.1f.f | 29 ++ sources/Example_ordered.2c.c | 22 + sources/Example_ordered.2f.f | 26 ++ sources/Example_ordered.3c.c | 23 + sources/Example_ordered.3f.f | 23 + sources/Example_parallel.1c.c | 41 ++ sources/Example_parallel.1f.f | 42 ++ sources/Example_ploop.1c.c | 15 + sources/Example_ploop.1f.f | 17 + sources/Example_pra_iterator.1c.c | 18 + sources/Example_private.1c.c | 32 ++ sources/Example_private.1f.f | 18 + sources/Example_private.2c.c | 25 ++ sources/Example_private.2f.f | 31 ++ sources/Example_private.3c.c | 23 + sources/Example_private.3f.f | 18 + sources/Example_psections.1c.c | 25 ++ sources/Example_psections.1f.f | 17 + sources/Example_reduction.1c.c | 26 ++ sources/Example_reduction.1f.f | 23 + sources/Example_reduction.2c.c | 40 ++ sources/Example_reduction.2f.f | 35 ++ sources/Example_reduction.3c.c | 29 ++ sources/Example_reduction.3f.f | 20 + sources/Example_reduction.4f.f | 17 + sources/Example_reduction.5f.f | 20 + sources/Example_reduction.6f.f | 26 ++ sources/Example_set_dynamic_nthrs.1c.c | 29 ++ sources/Example_set_dynamic_nthrs.1f.f | 35 ++ sources/Example_simple_lock.1c.c | 40 ++ sources/Example_simple_lock.1f.f | 41 ++ sources/Example_single.1c.c | 30 ++ sources/Example_single.1f.f | 33 ++ sources/Example_standalone.1c.c | 33 ++ sources/Example_standalone.1f.f | 46 ++ sources/Example_standalone.2c.c | 27 ++ sources/Example_standalone.2f.f | 33 ++ sources/Example_target.1c.c | 20 + sources/Example_target.1f.f | 17 + sources/Example_target.2c.c | 20 + sources/Example_target.2f.f | 17 + sources/Example_target.3c.c | 20 + sources/Example_target.3f.f | 17 + sources/Example_target.4bf.f | 20 + sources/Example_target.4c.c | 19 + sources/Example_target.4f.f | 20 + sources/Example_target.5c.c | 22 + sources/Example_target.5f.f | 21 + sources/Example_target_data.1c.c | 22 + sources/Example_target_data.1f.f | 19 + sources/Example_target_data.2c.c | 28 ++ sources/Example_target_data.2f.f | 26 ++ sources/Example_target_data.3c.c | 25 ++ sources/Example_target_data.3f.f | 27 ++ sources/Example_target_data.4c.c | 26 ++ sources/Example_target_data.4f.f | 27 ++ sources/Example_target_data.5c.c | 27 ++ sources/Example_target_data.5f.f | 34 ++ sources/Example_target_data.6c.c | 29 ++ sources/Example_target_data.6f.f | 30 ++ sources/Example_target_data.7c.c | 23 + sources/Example_target_data.7f.f | 23 + sources/Example_target_update.1c.c | 29 ++ sources/Example_target_update.1f.f | 27 ++ sources/Example_target_update.2c.c | 32 ++ sources/Example_target_update.2f.f | 36 ++ sources/Example_taskgroup.1c.c | 59 +++ sources/Example_taskgroup.1f.f | 53 +++ sources/Example_tasking.10c.c | 30 ++ sources/Example_tasking.10f.f | 30 ++ sources/Example_tasking.11c.c | 18 + sources/Example_tasking.11f.f | 14 + sources/Example_tasking.12c.c | 18 + sources/Example_tasking.12f.f | 14 + sources/Example_tasking.13c.c | 39 ++ sources/Example_tasking.13f.f | 33 ++ sources/Example_tasking.14c.c | 27 ++ sources/Example_tasking.14f.f | 26 ++ sources/Example_tasking.15c.c | 21 + sources/Example_tasking.15f.f | 19 + sources/Example_tasking.16c.c | 21 + sources/Example_tasking.16f.f | 19 + sources/Example_tasking.17c.c | 23 + sources/Example_tasking.17f.f | 20 + sources/Example_tasking.18c.c | 23 + sources/Example_tasking.18f.f | 22 + sources/Example_tasking.19c.c | 25 ++ sources/Example_tasking.19f.f | 27 ++ sources/Example_tasking.1c.c | 21 + sources/Example_tasking.1f.f | 22 + sources/Example_tasking.2c.c | 22 + sources/Example_tasking.2f.f | 23 + sources/Example_tasking.3c.c | 33 ++ sources/Example_tasking.3f.f | 33 ++ sources/Example_tasking.4c.c | 20 + sources/Example_tasking.4f.f | 20 + sources/Example_tasking.5c.c | 23 + sources/Example_tasking.5f.f | 19 + sources/Example_tasking.6c.c | 27 ++ sources/Example_tasking.6f.f | 19 + sources/Example_tasking.7c.c | 29 ++ sources/Example_tasking.7f.f | 26 ++ sources/Example_tasking.8c.c | 28 ++ sources/Example_tasking.8f.f | 24 ++ sources/Example_tasking.9c.c | 24 ++ sources/Example_tasking.9f.f | 28 ++ sources/Example_taskyield.1c.c | 26 ++ sources/Example_taskyield.1f.f | 23 + sources/Example_teams.1c.c | 34 ++ sources/Example_teams.1f.f | 29 ++ sources/Example_teams.2c.c | 22 + sources/Example_teams.2f.f | 23 + sources/Example_teams.3c.c | 17 + sources/Example_teams.3f.f | 17 + sources/Example_teams.4c.c | 20 + sources/Example_teams.4f.f | 24 ++ sources/Example_teams.5c.c | 19 + sources/Example_teams.5f.f | 17 + sources/Example_teams.6c.c | 19 + sources/Example_teams.6f.f | 17 + sources/Example_threadprivate.1c.c | 15 + sources/Example_threadprivate.1f.f | 13 + sources/Example_threadprivate.2c.c | 14 + sources/Example_threadprivate.2f.f | 14 + sources/Example_threadprivate.3c.c | 44 ++ sources/Example_threadprivate.3f.f | 16 + sources/Example_threadprivate.4c.c | 13 + sources/Example_threadprivate.4f.f | 18 + sources/Example_threadprivate.5c.c | 12 + sources/Example_threadprivate.5f.f | 40 ++ sources/Example_threadprivate.6f.f | 30 ++ sources/Example_workshare.1f.f | 18 + sources/Example_workshare.2f.f | 20 + sources/Example_workshare.3f.f | 19 + sources/Example_workshare.4f.f | 21 + sources/Example_workshare.5f.f | 20 + sources/Example_workshare.6f.f | 20 + sources/Example_workshare.7f.f | 17 + sources/Example_worksharing_critical.1c.c | 27 ++ sources/Example_worksharing_critical.1f.f | 21 + 357 files changed, 10840 insertions(+) create mode 100644 Changes.log create mode 100644 Examples_Chapt.tex create mode 100644 Examples_affinity.tex create mode 100644 Examples_array_sections.tex create mode 100644 Examples_associate.tex create mode 100644 Examples_async_target.tex create mode 100644 Examples_atomic.tex create mode 100644 Examples_atomic_restrict.tex create mode 100644 Examples_barrier_regions.tex create mode 100644 Examples_cancellation.tex create mode 100644 Examples_carrays_fpriv.tex create mode 100644 Examples_collapse.tex create mode 100644 Examples_cond_comp.tex create mode 100644 Examples_copyin.tex create mode 100644 Examples_copyprivate.tex create mode 100644 Examples_critical.tex create mode 100644 Examples_declare_target.tex create mode 100644 Examples_default_none.tex create mode 100644 Examples_device.tex create mode 100644 Examples_flush_nolist.tex create mode 100644 Examples_fort_do.tex create mode 100644 Examples_fort_loopvar.tex create mode 100644 Examples_fort_race.tex create mode 100644 Examples_fort_sa_private.tex create mode 100644 Examples_fort_sp_common.tex create mode 100644 Examples_fpriv_sections.tex create mode 100644 Examples_get_nthrs.tex create mode 100644 Examples_icv.tex create mode 100644 Examples_init_lock.tex create mode 100644 Examples_lastprivate.tex create mode 100644 Examples_lock_owner.tex create mode 100644 Examples_master.tex create mode 100644 Examples_mem_model.tex create mode 100644 Examples_nestable_lock.tex create mode 100644 Examples_nested_loop.tex create mode 100644 Examples_nesting_restrict.tex create mode 100644 Examples_nowait.tex create mode 100644 Examples_nthrs_dynamic.tex create mode 100644 Examples_nthrs_nesting.tex create mode 100644 Examples_ordered.tex create mode 100644 Examples_parallel.tex create mode 100644 Examples_ploop.tex create mode 100644 Examples_pra_iterator.tex create mode 100644 Examples_private.tex create mode 100644 Examples_psections.tex create mode 100644 Examples_reduction.tex create mode 100644 Examples_set_dynamic_nthrs.tex create mode 100644 Examples_simple_lock.tex create mode 100644 Examples_single.tex create mode 100644 Examples_standalone.tex create mode 100644 Examples_target.tex create mode 100644 Examples_target_data.tex create mode 100644 Examples_target_update.tex create mode 100644 Examples_taskgroup.tex create mode 100644 Examples_tasking.tex create mode 100644 Examples_taskyield.tex create mode 100644 Examples_teams.tex create mode 100644 Examples_threadprivate.tex create mode 100644 Examples_workshare.tex create mode 100644 Examples_worksharing_critical.tex create mode 100644 Introduction_Chapt.tex create mode 100644 Makefile create mode 100644 README create mode 100644 Title_Page.tex create mode 100644 figs/proc_bind_fig.pdf create mode 100644 figs/proc_bind_fig.png create mode 100644 openmp-examples.tex create mode 100644 openmp-logo.png create mode 100644 openmp.sty create mode 100644 sources/Example_affinity.1c.c create mode 100644 sources/Example_affinity.1f.f create mode 100644 sources/Example_affinity.2c.c create mode 100644 sources/Example_affinity.2f.f create mode 100644 sources/Example_affinity.3c.c create mode 100644 sources/Example_affinity.3f.f create mode 100644 sources/Example_affinity.4c.c create mode 100644 sources/Example_affinity.4f.f create mode 100644 sources/Example_affinity.5c.c create mode 100644 sources/Example_affinity.5f.f create mode 100644 sources/Example_array_sections.1c.c create mode 100644 sources/Example_array_sections.1f.f create mode 100644 sources/Example_array_sections.2c.c create mode 100644 sources/Example_array_sections.2f.f create mode 100644 sources/Example_array_sections.3c.c create mode 100644 sources/Example_array_sections.3f.f create mode 100644 sources/Example_array_sections.4c.c create mode 100644 sources/Example_array_sections.4f.f create mode 100644 sources/Example_associate.1f.f create mode 100644 sources/Example_associate.2f.f create mode 100644 sources/Example_associate.3f.f create mode 100644 sources/Example_async_target.1c.c create mode 100644 sources/Example_async_target.1f.f create mode 100644 sources/Example_async_target.2c.c create mode 100644 sources/Example_async_target.2f.f create mode 100644 sources/Example_atomic.1c.c create mode 100644 sources/Example_atomic.1f.f create mode 100644 sources/Example_atomic.2c.c create mode 100644 sources/Example_atomic.2f.f create mode 100644 sources/Example_atomic.3c.c create mode 100644 sources/Example_atomic.3f.f create mode 100644 sources/Example_atomic_restrict.1c.c create mode 100644 sources/Example_atomic_restrict.1f.f create mode 100644 sources/Example_atomic_restrict.2c.c create mode 100644 sources/Example_atomic_restrict.2f.f create mode 100644 sources/Example_atomic_restrict.3f.f create mode 100644 sources/Example_barrier_regions.1c.c create mode 100644 sources/Example_barrier_regions.1f.f create mode 100644 sources/Example_cancellation.1c.c create mode 100644 sources/Example_cancellation.1f.f create mode 100644 sources/Example_cancellation.2c.c create mode 100644 sources/Example_cancellation.2f.f create mode 100644 sources/Example_carrays_fpriv.1c.c create mode 100644 sources/Example_collapse.1c.c create mode 100644 sources/Example_collapse.1f.f create mode 100644 sources/Example_collapse.2c.c create mode 100644 sources/Example_collapse.2f.f create mode 100644 sources/Example_collapse.3c.c create mode 100644 sources/Example_collapse.3f.f create mode 100644 sources/Example_cond_comp.1c.c create mode 100644 sources/Example_cond_comp.1f.f create mode 100644 sources/Example_copyin.1c.c create mode 100644 sources/Example_copyin.1f.f create mode 100644 sources/Example_copyprivate.1c.c create mode 100644 sources/Example_copyprivate.1f.f create mode 100644 sources/Example_copyprivate.2c.c create mode 100644 sources/Example_copyprivate.2f.f create mode 100644 sources/Example_copyprivate.3c.c create mode 100644 sources/Example_copyprivate.3f.f create mode 100644 sources/Example_copyprivate.4f.f create mode 100644 sources/Example_critical.1c.c create mode 100644 sources/Example_critical.1f.f create mode 100644 sources/Example_declare_target.1c.c create mode 100644 sources/Example_declare_target.1f.f create mode 100644 sources/Example_declare_target.2c.c create mode 100644 sources/Example_declare_target.2f.f create mode 100644 sources/Example_declare_target.3c.c create mode 100644 sources/Example_declare_target.3f.f create mode 100644 sources/Example_declare_target.4c.c create mode 100644 sources/Example_declare_target.4f.f create mode 100644 sources/Example_declare_target.5c.c create mode 100644 sources/Example_declare_target.5f.f create mode 100644 sources/Example_default_none.1c.c create mode 100644 sources/Example_default_none.1f.f create mode 100644 sources/Example_device.1c.c create mode 100644 sources/Example_device.1f.f create mode 100644 sources/Example_device.2c.c create mode 100644 sources/Example_device.2f.f create mode 100644 sources/Example_device.3c.c create mode 100644 sources/Example_device.3f.f create mode 100644 sources/Example_flush_nolist.1c.c create mode 100644 sources/Example_flush_nolist.1f.f create mode 100644 sources/Example_fort_do.1f.f create mode 100644 sources/Example_fort_do.2f.f create mode 100644 sources/Example_fort_loopvar.1f.f create mode 100644 sources/Example_fort_loopvar.2f.f create mode 100644 sources/Example_fort_race.1f.f create mode 100644 sources/Example_fort_sa_private.1f.f create mode 100644 sources/Example_fort_sa_private.2f.f create mode 100644 sources/Example_fort_sa_private.3f.f create mode 100644 sources/Example_fort_sa_private.4f.f create mode 100644 sources/Example_fort_sa_private.5f.f create mode 100644 sources/Example_fort_sp_common.1f.f create mode 100644 sources/Example_fort_sp_common.2f.f create mode 100644 sources/Example_fort_sp_common.3f.f create mode 100644 sources/Example_fort_sp_common.4f.f create mode 100644 sources/Example_fort_sp_common.5f.f create mode 100644 sources/Example_fpriv_sections.1c.c create mode 100644 sources/Example_fpriv_sections.1f.f create mode 100644 sources/Example_get_nthrs.1c.c create mode 100644 sources/Example_get_nthrs.1f.f create mode 100644 sources/Example_get_nthrs.2c.c create mode 100644 sources/Example_get_nthrs.2f.f create mode 100644 sources/Example_icv.1c.c create mode 100644 sources/Example_icv.1f.f create mode 100644 sources/Example_init_lock.1c.c create mode 100644 sources/Example_init_lock.1f.f create mode 100644 sources/Example_lastprivate.1c.c create mode 100644 sources/Example_lastprivate.1f.f create mode 100644 sources/Example_lock_owner.1c.c create mode 100644 sources/Example_lock_owner.1f.f create mode 100644 sources/Example_master.1c.c create mode 100644 sources/Example_master.1f.f create mode 100644 sources/Example_mem_model.1c.c create mode 100644 sources/Example_mem_model.1f.f create mode 100644 sources/Example_mem_model.2c.c create mode 100644 sources/Example_mem_model.2f.f create mode 100644 sources/Example_mem_model.3c.c create mode 100644 sources/Example_mem_model.3f.f create mode 100644 sources/Example_nestable_lock.1c.c create mode 100644 sources/Example_nestable_lock.1f.f create mode 100644 sources/Example_nested_loop.1c.c create mode 100644 sources/Example_nested_loop.1f.f create mode 100644 sources/Example_nested_loop.2c.c create mode 100644 sources/Example_nested_loop.2f.f create mode 100644 sources/Example_nesting_restrict.1c.c create mode 100644 sources/Example_nesting_restrict.1f.f create mode 100644 sources/Example_nesting_restrict.2c.c create mode 100644 sources/Example_nesting_restrict.2f.f create mode 100644 sources/Example_nesting_restrict.3c.c create mode 100644 sources/Example_nesting_restrict.3f.f create mode 100644 sources/Example_nesting_restrict.4c.c create mode 100644 sources/Example_nesting_restrict.4f.f create mode 100644 sources/Example_nesting_restrict.5c.c create mode 100644 sources/Example_nesting_restrict.5f.f create mode 100644 sources/Example_nesting_restrict.6c.c create mode 100644 sources/Example_nesting_restrict.6f.f create mode 100644 sources/Example_nowait.1c.c create mode 100644 sources/Example_nowait.1f.f create mode 100644 sources/Example_nowait.2c.c create mode 100644 sources/Example_nowait.2f.f create mode 100644 sources/Example_nthrs_dynamic.1c.c create mode 100644 sources/Example_nthrs_dynamic.1f.f create mode 100644 sources/Example_nthrs_dynamic.2c.c create mode 100644 sources/Example_nthrs_dynamic.2f.f create mode 100644 sources/Example_nthrs_nesting.1c.c create mode 100644 sources/Example_nthrs_nesting.1f.f create mode 100644 sources/Example_ordered.1c.c create mode 100644 sources/Example_ordered.1f.f create mode 100644 sources/Example_ordered.2c.c create mode 100644 sources/Example_ordered.2f.f create mode 100644 sources/Example_ordered.3c.c create mode 100644 sources/Example_ordered.3f.f create mode 100644 sources/Example_parallel.1c.c create mode 100644 sources/Example_parallel.1f.f create mode 100644 sources/Example_ploop.1c.c create mode 100644 sources/Example_ploop.1f.f create mode 100644 sources/Example_pra_iterator.1c.c create mode 100644 sources/Example_private.1c.c create mode 100644 sources/Example_private.1f.f create mode 100644 sources/Example_private.2c.c create mode 100644 sources/Example_private.2f.f create mode 100644 sources/Example_private.3c.c create mode 100644 sources/Example_private.3f.f create mode 100644 sources/Example_psections.1c.c create mode 100644 sources/Example_psections.1f.f create mode 100644 sources/Example_reduction.1c.c create mode 100644 sources/Example_reduction.1f.f create mode 100644 sources/Example_reduction.2c.c create mode 100644 sources/Example_reduction.2f.f create mode 100644 sources/Example_reduction.3c.c create mode 100644 sources/Example_reduction.3f.f create mode 100644 sources/Example_reduction.4f.f create mode 100644 sources/Example_reduction.5f.f create mode 100644 sources/Example_reduction.6f.f create mode 100644 sources/Example_set_dynamic_nthrs.1c.c create mode 100644 sources/Example_set_dynamic_nthrs.1f.f create mode 100644 sources/Example_simple_lock.1c.c create mode 100644 sources/Example_simple_lock.1f.f create mode 100644 sources/Example_single.1c.c create mode 100644 sources/Example_single.1f.f create mode 100644 sources/Example_standalone.1c.c create mode 100644 sources/Example_standalone.1f.f create mode 100644 sources/Example_standalone.2c.c create mode 100644 sources/Example_standalone.2f.f create mode 100644 sources/Example_target.1c.c create mode 100644 sources/Example_target.1f.f create mode 100644 sources/Example_target.2c.c create mode 100644 sources/Example_target.2f.f create mode 100644 sources/Example_target.3c.c create mode 100644 sources/Example_target.3f.f create mode 100644 sources/Example_target.4bf.f create mode 100644 sources/Example_target.4c.c create mode 100644 sources/Example_target.4f.f create mode 100644 sources/Example_target.5c.c create mode 100644 sources/Example_target.5f.f create mode 100644 sources/Example_target_data.1c.c create mode 100644 sources/Example_target_data.1f.f create mode 100644 sources/Example_target_data.2c.c create mode 100644 sources/Example_target_data.2f.f create mode 100644 sources/Example_target_data.3c.c create mode 100644 sources/Example_target_data.3f.f create mode 100644 sources/Example_target_data.4c.c create mode 100644 sources/Example_target_data.4f.f create mode 100644 sources/Example_target_data.5c.c create mode 100644 sources/Example_target_data.5f.f create mode 100644 sources/Example_target_data.6c.c create mode 100644 sources/Example_target_data.6f.f create mode 100644 sources/Example_target_data.7c.c create mode 100644 sources/Example_target_data.7f.f create mode 100644 sources/Example_target_update.1c.c create mode 100644 sources/Example_target_update.1f.f create mode 100644 sources/Example_target_update.2c.c create mode 100644 sources/Example_target_update.2f.f create mode 100644 sources/Example_taskgroup.1c.c create mode 100644 sources/Example_taskgroup.1f.f create mode 100644 sources/Example_tasking.10c.c create mode 100644 sources/Example_tasking.10f.f create mode 100644 sources/Example_tasking.11c.c create mode 100644 sources/Example_tasking.11f.f create mode 100644 sources/Example_tasking.12c.c create mode 100644 sources/Example_tasking.12f.f create mode 100644 sources/Example_tasking.13c.c create mode 100644 sources/Example_tasking.13f.f create mode 100644 sources/Example_tasking.14c.c create mode 100644 sources/Example_tasking.14f.f create mode 100644 sources/Example_tasking.15c.c create mode 100644 sources/Example_tasking.15f.f create mode 100644 sources/Example_tasking.16c.c create mode 100644 sources/Example_tasking.16f.f create mode 100644 sources/Example_tasking.17c.c create mode 100644 sources/Example_tasking.17f.f create mode 100644 sources/Example_tasking.18c.c create mode 100644 sources/Example_tasking.18f.f create mode 100644 sources/Example_tasking.19c.c create mode 100644 sources/Example_tasking.19f.f create mode 100644 sources/Example_tasking.1c.c create mode 100644 sources/Example_tasking.1f.f create mode 100644 sources/Example_tasking.2c.c create mode 100644 sources/Example_tasking.2f.f create mode 100644 sources/Example_tasking.3c.c create mode 100644 sources/Example_tasking.3f.f create mode 100644 sources/Example_tasking.4c.c create mode 100644 sources/Example_tasking.4f.f create mode 100644 sources/Example_tasking.5c.c create mode 100644 sources/Example_tasking.5f.f create mode 100644 sources/Example_tasking.6c.c create mode 100644 sources/Example_tasking.6f.f create mode 100644 sources/Example_tasking.7c.c create mode 100644 sources/Example_tasking.7f.f create mode 100644 sources/Example_tasking.8c.c create mode 100644 sources/Example_tasking.8f.f create mode 100644 sources/Example_tasking.9c.c create mode 100644 sources/Example_tasking.9f.f create mode 100644 sources/Example_taskyield.1c.c create mode 100644 sources/Example_taskyield.1f.f create mode 100644 sources/Example_teams.1c.c create mode 100644 sources/Example_teams.1f.f create mode 100644 sources/Example_teams.2c.c create mode 100644 sources/Example_teams.2f.f create mode 100644 sources/Example_teams.3c.c create mode 100644 sources/Example_teams.3f.f create mode 100644 sources/Example_teams.4c.c create mode 100644 sources/Example_teams.4f.f create mode 100644 sources/Example_teams.5c.c create mode 100644 sources/Example_teams.5f.f create mode 100644 sources/Example_teams.6c.c create mode 100644 sources/Example_teams.6f.f create mode 100644 sources/Example_threadprivate.1c.c create mode 100644 sources/Example_threadprivate.1f.f create mode 100644 sources/Example_threadprivate.2c.c create mode 100644 sources/Example_threadprivate.2f.f create mode 100644 sources/Example_threadprivate.3c.c create mode 100644 sources/Example_threadprivate.3f.f create mode 100644 sources/Example_threadprivate.4c.c create mode 100644 sources/Example_threadprivate.4f.f create mode 100644 sources/Example_threadprivate.5c.c create mode 100644 sources/Example_threadprivate.5f.f create mode 100644 sources/Example_threadprivate.6f.f create mode 100644 sources/Example_workshare.1f.f create mode 100644 sources/Example_workshare.2f.f create mode 100644 sources/Example_workshare.3f.f create mode 100644 sources/Example_workshare.4f.f create mode 100644 sources/Example_workshare.5f.f create mode 100644 sources/Example_workshare.6f.f create mode 100644 sources/Example_workshare.7f.f create mode 100644 sources/Example_worksharing_critical.1c.c create mode 100644 sources/Example_worksharing_critical.1f.f diff --git a/Changes.log b/Changes.log new file mode 100644 index 0000000..b47860c --- /dev/null +++ b/Changes.log @@ -0,0 +1,80 @@ +[6-Jan-2015] Version 4.0.1ltx +Changes from 4.0.1ltx-21Nov-2014 + +1. openmp.sty and openmp-examples.tex + enable source line numbering + +2. Split chapters in the main file (Examples_Sects.tex) into individual files + Makefile and openmp-examples.tex were modified to use the new list. + +3. Additional changes related to fixing fonts and language markers + +Below is a summary. + ++Page 2: "non- compound" -> "non-compound" ++Page 10: fixed mis-placed language markers ++Chap-8, page 24: fixed variable fonts for T, P, T/P ++Chap-19. page 79-80: added missing Fortran cont. marker ++Chap-25, page 100: combined 25.2f & 25.3f into one Fortran marker ++Chap-30, page 120: combined 30.2c & 30.3c into one C/C++ marker ++Chap-30, page 122-123: added missing Fortran cont. marker ++Chap-32, page 127: added missing Fortran cont. marker ++Chap-36, page 138-139: added missing Fortran cont. marker ++Chap-39, page 147: added missing Fortran cont. marker ++Chap-50, page 182: fixed variables p, v1, v2 fonts ++Chap-51, page 189: fixed variables p, v1, v2 fonts ++Chap-52. page 201: fixed variable fonts, function fonts ++Chap-53. page 205: fixed variable fonts, function fonts ++Chap-54. page 215: fixed variable fonts ++Chap-58, page 237: fixed variable fonts ++Chap-58, page 237: Minor wording change to reflect the new placement of the Example header. + +Modification applied to the following files: + Examples_Chapt.tex + Examples_affinity.tex + Examples_associate.tex + Examples_atomic_restrict.tex + Examples_cond_comp.tex + Examples_declare_target.tex + Examples_fort_sa_private.tex + Examples_fort_sp_common.tex + Examples_reduction.tex + Examples_target.tex + Examples_target_data.tex + Examples_target_update.tex + Examples_teams.tex + Examples_threadprivate.tex + Examples_workshare.tex + +4. Other notes + ++Chap-12, page 37: placement of C/C++ marker changed, but OK ++Chap-29, page 114: marker moved, but OK. ++Chap-50, page 187: Example 50.4bf header added. + Fortran marker changed, but OK ++Chap-51, page 192: "Example 51.3c" added, and example numbering + shifted thereafter. + + +[21-Nov-2014] Initial 4.0.1ltx +Changes from 4.0.1ltx-3Jun2014 + +1. openmp.sty + change from using mnemonics + \def\ename{\escstr{#1}.#2} + to seqential numbering + \def\ename{\thechapter.#2} + + For "fnexample()" definition, firstline=6, not 8 + +2. source file changes + sources - use the "original" sources from 4.0.1 + +3. Version Number + openmp-examples.tex: + change footnote "Version 4.0 - July 2013" + to "Version 4.0.1 - February 2014" + Title_Page.tex: + change from "November, 2013" to "February, 2014" + "1997-2013" -> "1997-2014" + diff --git a/Examples_Chapt.tex b/Examples_Chapt.tex new file mode 100644 index 0000000..38b4d2d --- /dev/null +++ b/Examples_Chapt.tex @@ -0,0 +1,9 @@ + +\chapter*{Examples} +\label{chap:examples} +The following are examples of the OpenMP API directives, constructs, and routines. +\ccppspecificstart +A statement following a directive is compound only when necessary, and a +non-compound statement is indented with respect to a directive preceding it. +\ccppspecificend + diff --git a/Examples_affinity.tex b/Examples_affinity.tex new file mode 100644 index 0000000..a5029cb --- /dev/null +++ b/Examples_affinity.tex @@ -0,0 +1,243 @@ +\pagebreak +\chapter{The \code{proc\_bind} Clause} +\label{chap:affinity} + +The following examples demonstrate how to use the \code{proc\_bind} clause to +control the thread binding for a team of threads in a \code{parallel} region. +The machine architecture is depicted in the figure below. It consists of two sockets, +each equipped with a quad-core processor and configured to execute two hardware +threads simultaneously on each core. These examples assume a contiguous core numbering +starting from 0, such that the hardware threads 0,1 form the first physical core. + +\ifpdf +%\begin{figure}[htbp] +\centerline{\includegraphics[width=3.8in,keepaspectratio=true]% +{figs/proc_bind_fig.pdf}} +%\end{figure} +\fi + +The following equivalent place list declarations consist of eight places (which +we designate as p0 to p7): + +\code{OMP\_PLACES=\texttt{"}\{0,1\},\{2,3\},\{4,5\},\{6,7\},\{8,9\},\{10,11\},\{12,13\},\{14,15\}\texttt{"}} + +or + +\code{OMP\_PLACES=\texttt{"}\{0:2\}:8:2\texttt{"}} + +\section{Spread Affinity Policy} + +The following example shows the result of the \code{spread} affinity policy on +the partition list when the number of threads is less than or equal to the number +of places in the parent's place partition, for the machine architecture depicted +above. Note that the threads are bound to the first place of each subpartition. + +\cexample{affinity}{1c} + +\fexample{affinity}{1f} + +It is unspecified on which place the master thread is initially started. If the +master thread is initially started on p0, the following placement of threads will +be applied in the parallel region: + +\begin{compactitem} +\item thread 0 executes on p0 with the place partition p0,p1 + +\item thread 1 executes on p2 with the place partition p2,p3 + +\item thread 2 executes on p4 with the place partition p4,p5 + +\item thread 3 executes on p6 with the place partition p6,p7 +\end{compactitem} + + +If the master thread would initially be started on p2, the placement of threads +and distribution of the place partition would be as follows: + +\begin{compactitem} +\item thread 0 executes on p2 with the place partition p2,p3 + +\item thread 1 executes on p4 with the place partition p4,p5 + +\item thread 2 executes on p6 with the place partition p6,p7 + +\item thread 3 executes on p0 with the place partition p0,p1 +\end{compactitem} + +The following example illustrates the \code{spread} thread affinity policy when +the number of threads is greater than the number of places in the parent's place +partition. + +Let \plc{T} be the number of threads in the team, and \plc{P} be the number of places in the +parent's place partition. The first \plc{T/P} threads of the team (including the master +thread) execute on the parent's place. The next \plc{T/P} threads execute on the next +place in the place partition, and so on, with wrap around. + +\cexample{affinity}{2c} + +\fexample{affinity}{2f} + +It is unspecified on which place the master thread is initially started. If the +master thread is initially started on p0, the following placement of threads will +be applied in the parallel region: + +\begin{compactitem} +\item threads 0,1 execute on p0 with the place partition p0 + +\item threads 2,3 execute on p1 with the place partition p1 + +\item threads 4,5 execute on p2 with the place partition p2 + +\item threads 6,7 execute on p3 with the place partition p3 + +\item threads 8,9 execute on p4 with the place partition p4 + +\item threads 10,11 execute on p5 with the place partition p5 + +\item threads 12,13 execute on p6 with the place partition p6 + +\item threads 14,15 execute on p7 with the place partition p7 +\end{compactitem} + +If the master thread would initially be started on p2, the placement of threads +and distribution of the place partition would be as follows: + +\begin{compactitem} +\item threads 0,1 execute on p2 with the place partition p2 + +\item threads 2,3 execute on p3 with the place partition p3 + +\item threads 4,5 execute on p4 with the place partition p4 + +\item threads 6,7 execute on p5 with the place partition p5 + +\item threads 8,9 execute on p6 with the place partition p6 + +\item threads 10,11 execute on p7 with the place partition p7 + +\item threads 12,13 execute on p0 with the place partition p0 + +\item threads 14,15 execute on p1 with the place partition p1 +\end{compactitem} + +\section{Close Affinity Policy} + +The following example shows the result of the \code{close} affinity policy on +the partition list when the number of threads is less than or equal to the number +of places in parent's place partition, for the machine architecture depicted above. +The place partition is not changed by the \code{close} policy. + +\cexample{affinity}{3c} + +\fexample{affinity}{3f} + +It is unspecified on which place the master thread is initially started. If the +master thread is initially started on p0, the following placement of threads will +be applied in the \code{parallel} region: + +\begin{compactitem} +\item thread 0 executes on p0 with the place partition p0-p7 + +\item thread 1 executes on p1 with the place partition p0-p7 + +\item thread 2 executes on p2 with the place partition p0-p7 + +\item thread 3 executes on p3 with the place partition p0-p7 +\end{compactitem} + +If the master thread would initially be started on p2, the placement of threads +and distribution of the place partition would be as follows: + +\begin{compactitem} +\item thread 0 executes on p2 with the place partition p0-p7 + +\item thread 1 executes on p3 with the place partition p0-p7 + +\item thread 2 executes on p4 with the place partition p0-p7 + +\item thread 3 executes on p5 with the place partition p0-p7 +\end{compactitem} + +The following example illustrates the \code{close} thread affinity policy when +the number of threads is greater than the number of places in the parent's place +partition. + +Let \plc{T} be the number of threads in the team, and \plc{P} be the number of places in the +parent's place partition. The first \plc{T/P} threads of the team (including the master +thread) execute on the parent's place. The next \plc{T/P} threads execute on the next +place in the place partition, and so on, with wrap around. The place partition +is not changed by the \code{close} policy. + +\cexample{affinity}{4c} + +\fexample{affinity}{4f} + +It is unspecified on which place the master thread is initially started. If the +master thread is initially running on p0, the following placement of threads will +be applied in the parallel region: + +\begin{compactitem} +\item threads 0,1 execute on p0 with the place partition p0-p7 + +\item threads 2,3 execute on p1 with the place partition p0-p7 + +\item threads 4,5 execute on p2 with the place partition p0-p7 + +\item threads 6,7 execute on p3 with the place partition p0-p7 + +\item threads 8,9 execute on p4 with the place partition p0-p7 + +\item threads 10,11 execute on p5 with the place partition p0-p7 + +\item threads 12,13 execute on p6 with the place partition p0-p7 + +\item threads 14,15 execute on p7 with the place partition p0-p7 +\end{compactitem} + +If the master thread would initially be started on p2, the placement of threads +and distribution of the place partition would be as follows: + +\begin{compactitem} +\item threads 0,1 execute on p2 with the place partition p0-p7 + +\item threads 2,3 execute on p3 with the place partition p0-p7 + +\item threads 4,5 execute on p4 with the place partition p0-p7 + +\item threads 6,7 execute on p5 with the place partition p0-p7 + +\item threads 8,9 execute on p6 with the place partition p0-p7 + +\item threads 10,11 execute on p7 with the place partition p0-p7 + +\item threads 12,13 execute on p0 with the place partition p0-p7 + +\item threads 14,15 execute on p1 with the place partition p0-p7 +\end{compactitem} + +\section{Master Affinity Policy} + +The following example shows the result of the \code{master} affinity policy on +the partition list for the machine architecture depicted above. The place partition +is not changed by the master policy. + +\cexample{affinity}{5c} + +\fexample{affinity}{5f} + +It is unspecified on which place the master thread is initially started. If the +master thread is initially running on p0, the following placement of threads will +be applied in the parallel region: + +\begin{compactitem} +\item threads 0-3 execute on p0 with the place partition p0-p7 +\end{compactitem} + +If the master thread would initially be started on p2, the placement of threads +and distribution of the place partition would be as follows: + +\begin{compactitem} +\item threads 0-3 execute on p2 with the place partition p0-p7 +\end{compactitem} + + diff --git a/Examples_array_sections.tex b/Examples_array_sections.tex new file mode 100644 index 0000000..f1601ab --- /dev/null +++ b/Examples_array_sections.tex @@ -0,0 +1,35 @@ +\pagebreak +\chapter{Array Sections in Device Constructs} +\label{chap:array_sections} + +The following examples show the usage of array sections in \code{map} clauses +on \code{target} and \code{target} \code{data} constructs. + +This example shows the invalid usage of two seperate sections of the same array +inside of a \code{target} construct. + +\cexample{array_sections}{1c} + +\fexample{array_sections}{1f} + +This example shows the invalid usage of two separate sections of the same array +inside of a \code{target} construct. + +\cexample{array_sections}{2c} + +\fexample{array_sections}{2f} + +This example shows the valid usage of two separate sections of the same array inside +of a \code{target} construct. + +\cexample{array_sections}{3c} + +\fexample{array_sections}{3f} + +This example shows the valid usage of a wholly contained array section of an already +mapped array section inside of a \code{target} construct. + +\cexample{array_sections}{4c} + +\fexample{array_sections}{4f} + diff --git a/Examples_associate.tex b/Examples_associate.tex new file mode 100644 index 0000000..6946e0c --- /dev/null +++ b/Examples_associate.tex @@ -0,0 +1,32 @@ +\pagebreak +\chapter{Fortran \code{ASSOCIATE} Construct} +\fortranspecificstart +\label{chap:associate} + +The following is an invalid example of specifying an associate name on a data-sharing attribute +clause. The constraint in the Data Sharing Attribute Rules section in the OpenMP +4.0 API Specifications states that an associate name preserves the association +with the selector established at the \code{ASSOCIATE} statement. The associate +name \plc{b} is associated with the shared variable \plc{a}. With the predetermined data-sharing +attribute rule, the associate name \plc{b} is not allowed to be specified on the \code{private} +clause. + +\fnexample{associate}{1f} + +In next example, within the \code{parallel} construct, the association name \plc{thread\_id} +is associated with the private copy of \plc{i}. The print statement should output the +unique thread number. + +\fnexample{associate}{2f} + +The following example illustrates the effect of specifying a selector name on a data-sharing +attribute clause. The associate name \plc{u} is associated with \plc{v} and the variable \plc{v} +is specified on the \code{private} clause of the \code{parallel} construct. +The construct association is established prior to the \code{parallel} region. +The association between \plc{u} and the original \plc{v} is retained (see the Data Sharing +Attribute Rules section in the OpenMP 4.0 API Specifications). Inside the \code{parallel} +region, \plc{v} has the value of -1 and \plc{u} has the value of the original \plc{v}. + +\fnexample{associate}{3f} +\fortranspecificend + diff --git a/Examples_async_target.tex b/Examples_async_target.tex new file mode 100644 index 0000000..04c79cd --- /dev/null +++ b/Examples_async_target.tex @@ -0,0 +1,31 @@ +\pagebreak +\chapter{Asynchronous Execution of a \code{target} Region Using Tasks} +\label{chap:async_target} + +The following example shows how the \code{task} and \code{target} constructs +are used to execute multiple \code{target} regions asynchronously. The task that +encounters the \code{task} construct generates an explicit task that contains +a \code{target} region. The thread executing the explicit task encounters a task +scheduling point while waiting for the execution of the \code{target} region +to complete, allowing the thread to switch back to the execution of the encountering +task or one of the previously generated explicit tasks. + +\cexample{async_target}{1c} + +The Fortran version has an interface block that contains the \code{declare} \code{target}. +An identical statement exists in the function declaration (not shown here). + +\fexample{async_target}{1f} + +The following example shows how the \code{task} and \code{target} constructs +are used to execute multiple \code{target} regions asynchronously. The task dependence +ensures that the storage is allocated and initialized on the device before it is +accessed. + +\cexample{async_target}{2c} + +The Fortran example uses allocatable arrays for dynamic memory on the device. + +\fexample{async_target}{2f} + + diff --git a/Examples_atomic.tex b/Examples_atomic.tex new file mode 100644 index 0000000..f92bbf3 --- /dev/null +++ b/Examples_atomic.tex @@ -0,0 +1,44 @@ +\pagebreak +\chapter{The \code{atomic} Construct} +\label{chap:atomic} + +The following example avoids race conditions (simultaneous updates of an element +of \plc{x} by multiple threads) by using the \code{atomic} construct . + +The advantage of using the \code{atomic} construct in this example is that it +allows updates of two different elements of \plc{x} to occur in parallel. If +a \code{critical} construct were used instead, then all updates to elements of +\plc{x} would be executed serially (though not in any guaranteed order). + +Note that the \code{atomic} directive applies only to the statement immediately +following it. As a result, elements of \plc{y} are not updated atomically in +this example. + +\cexample{atomic}{1c} + +\fexample{atomic}{1f} + +The following example illustrates the \code{read} and \code{write} clauses +for the \code{atomic} directive. These clauses ensure that the given variable +is read or written, respectively, as a whole. Otherwise, some other thread might +read or write part of the variable while the current thread was reading or writing +another part of the variable. Note that most hardware provides atomic reads and +writes for some set of properly aligned variables of specific sizes, but not necessarily +for all the variable types supported by the OpenMP API. + +\cexample{atomic}{2c} + +\fexample{atomic}{2f} + +The following example illustrates the \code{capture} clause for the \code{atomic} +directive. In this case the value of a variable is captured, and then the variable +is incremented. These operations occur atomically. This particular example could +be implemented using the fetch-and-add instruction available on many kinds of hardware. +The example also shows a way to implement a spin lock using the \code{capture} + and \code{read} clauses. + +\cexample{atomic}{3c} + +\fexample{atomic}{3f} + + diff --git a/Examples_atomic_restrict.tex b/Examples_atomic_restrict.tex new file mode 100644 index 0000000..7394de3 --- /dev/null +++ b/Examples_atomic_restrict.tex @@ -0,0 +1,25 @@ +\pagebreak +\chapter{Restrictions on the \code{atomic} Construct} +\label{chap:atomic_restrict} + +The following non-conforming examples illustrate the restrictions on the \code{atomic} +construct. + +\cexample{atomic_restrict}{1c} + +\fexample{atomic_restrict}{1f} + +\cexample{atomic_restrict}{2c} + +\fortranspecificstart +The following example is non-conforming because \code{I} and \code{R} reference +the same location but have different types. + +\fnexample{atomic_restrict}{2f} + +Although the following example might work on some implementations, this is also +non-conforming: + +\fnexample{atomic_restrict}{3f} +\fortranspecificend + diff --git a/Examples_barrier_regions.tex b/Examples_barrier_regions.tex new file mode 100644 index 0000000..64b7eef --- /dev/null +++ b/Examples_barrier_regions.tex @@ -0,0 +1,24 @@ +\pagebreak +\chapter{Binding of \code{barrier} Regions} +\label{chap:barrier_regions} + +The binding rules call for a \code{barrier} region to bind to the closest enclosing +\code{parallel} region. + +In the following example, the call from the main program to \plc{sub2} is conforming +because the \code{barrier} region (in \plc{sub3}) binds to the \code{parallel} +region in \plc{sub2}. The call from the main program to \plc{sub1} is conforming +because the \code{barrier} region binds to the \code{parallel} region in subroutine +\plc{sub2}. + +The call from the main program to \plc{sub3} is conforming because the \code{barrier} +region binds to the implicit inactive \code{parallel} region enclosing the sequential +part. Also note that the \code{barrier} region in \plc{sub3} when called from +\plc{sub2} only synchronizes the team of threads in the enclosing \code{parallel} +region and not all the threads created in \plc{sub1}. + +\cexample{barrier_regions}{1c} + +\fexample{barrier_regions}{1f} + + diff --git a/Examples_cancellation.tex b/Examples_cancellation.tex new file mode 100644 index 0000000..7be91e8 --- /dev/null +++ b/Examples_cancellation.tex @@ -0,0 +1,42 @@ +\pagebreak +\chapter{Cancellation Constructs} +\label{chap:cancellation} + +The following example shows how the \code{cancel} directive can be used to terminate +an OpenMP region. Although the \code{cancel} construct terminates the OpenMP +worksharing region, programmers must still track the exception through the pointer +ex and issue a cancellation for the \code{parallel} region if an exception has +been raised. The master thread checks the exception pointer to make sure that the +exception is properly handled in the sequential part. If cancellation of the \code{parallel} +region has been requested, some threads might have executed \code{phase\_1()}. +However, it is guaranteed that none of the threads executed \code{phase\_2()}. + +\cexample{cancellation}{1c} + + +The following example illustrates the use of the \code{cancel} construct in error +handling. If there is an error condition from the \code{allocate} statement, +the cancellation is activated. The encountering thread sets the shared variable +\code{err} and other threads of the binding thread set proceed to the end of +the worksharing construct after the cancellation has been activated. + +\fexample{cancellation}{1f} + +The following example shows how to cancel a parallel search on a binary tree as +soon as the search value has been detected. The code creates a task to descend +into the child nodes of the current tree node. If the search value has been found, +the code remembers the tree node with the found value through an \code{atomic} +write to the result variable and then cancels execution of all search tasks. The +function \code{search\_tree\_parallel} groups all search tasks into a single +task group to control the effect of the \code{cancel taskgroup} directive. The +\plc{level} argument is used to create undeferred tasks after the first ten +levels of the tree. + +\cexample{cancellation}{2c} + + +The following is the equivalent parallel search example in Fortran. + +\fexample{cancellation}{2f} + + diff --git a/Examples_carrays_fpriv.tex b/Examples_carrays_fpriv.tex new file mode 100644 index 0000000..aad4b6d --- /dev/null +++ b/Examples_carrays_fpriv.tex @@ -0,0 +1,37 @@ +\pagebreak +\chapter{C/C++ Arrays in a \code{firstprivate} Clause} +\ccppspecificstart +\label{chap:carrays_fpriv} + +The following example illustrates the size and value of list items of array or +pointer type in a \code{firstprivate} clause . The size of new list items is +based on the type of the corresponding original list item, as determined by the +base language. + +In this example: + +\begin{compactitem} +\item The type of \code{A} is array of two arrays of two ints. + +\item The type of \code{B} is adjusted to pointer to array of \code{n} +ints, because it is a function parameter. + +\item The type of \code{C} is adjusted to pointer to int, because +it is a function parameter. + +\item The type of \code{D} is array of two arrays of two ints. + +\item The type of \code{E} is array of \code{n} arrays of \code{n} +ints. +\end{compactitem} + +Note that \code{B} and \code{E} involve variable length array types. + +The new items of array type are initialized as if each integer element of the original +array is assigned to the corresponding element of the new array. Those of pointer +type are initialized as if by assignment from the original item to the new item. + +\cnexample{carrays_fpriv}{1c} +\ccppspecificend + + diff --git a/Examples_collapse.tex b/Examples_collapse.tex new file mode 100644 index 0000000..6fd4dfd --- /dev/null +++ b/Examples_collapse.tex @@ -0,0 +1,77 @@ +\pagebreak +\chapter{The \code{collapse} Clause} +\label{chap:collapse} + +In the following example, the \code{k} and \code{j} loops are associated with +the loop construct. So the iterations of the \code{k} and \code{j} loops are +collapsed into one loop with a larger iteration space, and that loop is then divided +among the threads in the current team. Since the \code{i} loop is not associated +with the loop construct, it is not collapsed, and the \code{i} loop is executed +sequentially in its entirety in every iteration of the collapsed \code{k} and +\code{j} loop. + +The variable \code{j} can be omitted from the \code{private} clause when the +\code{collapse} clause is used since it is implicitly private. However, if the +\code{collapse} clause is omitted then \code{j} will be shared if it is omitted +from the \code{private} clause. In either case, \code{k} is implicitly private +and could be omitted from the \code{private} clause. + +\cexample{collapse}{1c} + +\fexample{collapse}{1f} + +In the next example, the \code{k} and \code{j} loops are associated with the +loop construct. So the iterations of the \code{k} and \code{j} loops are collapsed +into one loop with a larger iteration space, and that loop is then divided among +the threads in the current team. + +The sequential execution of the iterations in the \code{k} and \code{j} loops +determines the order of the iterations in the collapsed iteration space. This implies +that in the sequentially last iteration of the collapsed iteration space, \code{k} +will have the value \code{2} and \code{j} will have the value \code{3}. Since +\code{klast} and \code{jlast} are \code{lastprivate}, their values are assigned +by the sequentially last iteration of the collapsed \code{k} and \code{j} loop. +This example prints: \code{2 3}. + +\cexample{collapse}{2c} + +\fexample{collapse}{2f} + +The next example illustrates the interaction of the \code{collapse} and \code{ordered} + clauses. + +In the example, the loop construct has both a \code{collapse} clause and an \code{ordered} +clause. The \code{collapse} clause causes the iterations of the \code{k} and +\code{j} loops to be collapsed into one loop with a larger iteration space, and +that loop is divided among the threads in the current team. An \code{ordered} +clause is added to the loop construct, because an ordered region binds to the loop +region arising from the loop construct. + +According to \$, a thread must not execute more than one ordered region that binds +to the same loop region. So the \code{collapse} clause is required for the example +to be conforming. With the \code{collapse} clause, the iterations of the \code{k} +and \code{j} loops are collapsed into one loop, and therefore only one ordered +region will bind to the collapsed \code{k} and \code{j} loop. Without the \code{collapse} +clause, there would be two ordered regions that bind to each iteration of the \code{k} +loop (one arising from the first iteration of the \code{j} loop, and the other +arising from the second iteration of the \code{j} loop). + +The code prints + +\code{0 1 1} +\\ +\code{0 1 2} +\\ +\code{0 2 1} +\\ +\code{1 2 2} +\\ +\code{1 3 1} +\\ +\code{1 3 2} + +\cexample{collapse}{3c} + +\fexample{collapse}{3f} + + diff --git a/Examples_cond_comp.tex b/Examples_cond_comp.tex new file mode 100644 index 0000000..3f501b6 --- /dev/null +++ b/Examples_cond_comp.tex @@ -0,0 +1,21 @@ +\pagebreak +\chapter{Conditional Compilation} +\label{chap:cond_comp} + +\ccppspecificstart +The following example illustrates the use of conditional compilation using the +OpenMP macro \code{\_OPENMP}. With OpenMP compilation, the \code{\_OPENMP} +macro becomes defined. + +\cnexample{cond_comp}{1c} +\ccppspecificend + +\fortranspecificstart +The following example illustrates the use of the conditional compilation sentinel. +With OpenMP compilation, the conditional compilation sentinel \code{!\$} is recognized +and treated as two spaces. In fixed form source, statements guarded by the sentinel +must start after column 6. + +\fnexample{cond_comp}{1f} +\fortranspecificend + diff --git a/Examples_copyin.tex b/Examples_copyin.tex new file mode 100644 index 0000000..5eb1496 --- /dev/null +++ b/Examples_copyin.tex @@ -0,0 +1,13 @@ +\pagebreak +\chapter{The \code{copyin} Clause} +\label{chap:copyin} + +The \code{copyin} clause is used to initialize threadprivate data upon entry +to a \code{parallel} region. The value of the threadprivate variable in the master +thread is copied to the threadprivate variable of each other team member. + +\cexample{copyin}{1c} + +\fexample{copyin}{1f} + + diff --git a/Examples_copyprivate.tex b/Examples_copyprivate.tex new file mode 100644 index 0000000..6d91618 --- /dev/null +++ b/Examples_copyprivate.tex @@ -0,0 +1,51 @@ +\pagebreak +\chapter{The \code{copyprivate} Clause} +\label{chap:copyprivate} + +The \code{copyprivate} clause can be used to broadcast values acquired by a single +thread directly to all instances of the private variables in the other threads. +In this example, if the routine is called from the sequential part, its behavior +is not affected by the presence of the directives. If it is called from a \code{parallel} +region, then the actual arguments with which \code{a} and \code{b} are associated +must be private. + +The thread that executes the structured block associated with the \code{single} + construct broadcasts the values of the private variables \code{a}, \code{b}, +\code{x}, and +\code{y} from its implicit task's data environment to the data environments +of the other implicit tasks in the thread team. The broadcast completes before +any of the threads have left the barrier at the end of the construct. + +\cexample{copyprivate}{1c} + +\fexample{copyprivate}{1f} + +In this example, assume that the input must be performed by the master thread. +Since the \code{master} construct does not support the \code{copyprivate} clause, +it cannot broadcast the input value that is read. However, \code{copyprivate} +is used to broadcast an address where the input value is stored. + +\cexample{copyprivate}{2c} + +\fexample{copyprivate}{2f} + +Suppose that the number of lock variables required within a \code{parallel} region +cannot easily be determined prior to entering it. The \code{copyprivate} clause +can be used to provide access to shared lock variables that are allocated within +that \code{parallel} region. + +\cexample{copyprivate}{3c} + +\fortranspecificstart +\fnexample{copyprivate}{3f} + +Note that the effect of the \code{copyprivate} clause on a variable with the +\code{allocatable} attribute is different than on a variable with the \code{pointer} +attribute. The value of \code{A} is copied (as if by intrinsic assignment) and +the pointer \code{B} is copied (as if by pointer assignment) to the corresponding +list items in the other implicit tasks belonging to the \code{parallel} region. + +\fnexample{copyprivate}{4f} +\fortranspecificend + + diff --git a/Examples_critical.tex b/Examples_critical.tex new file mode 100644 index 0000000..0e84afc --- /dev/null +++ b/Examples_critical.tex @@ -0,0 +1,16 @@ +\pagebreak +\chapter{The \code{critical} Construct} +\label{chap:critical} + +The following example includes several \code{critical} constructs . The example +illustrates a queuing model in which a task is dequeued and worked on. To guard +against multiple threads dequeuing the same task, the dequeuing operation must +be in a \code{critical} region. Because the two queues in this example are independent, +they are protected by \code{critical} constructs with different names, \plc{xaxis} +and \plc{yaxis}. + +\cexample{critical}{1c} + +\fexample{critical}{1f} + + diff --git a/Examples_declare_target.tex b/Examples_declare_target.tex new file mode 100644 index 0000000..9802b3e --- /dev/null +++ b/Examples_declare_target.tex @@ -0,0 +1,111 @@ +\pagebreak +\chapter{\code{declare} \code{target} Construct} +\label{chap:declare_target} + +\section{\code{declare} \code{target} and \code{end} \code{declare} \code{target} for a Function} + +The following example shows how the \code{declare} \code{target} directive +is used to indicate that the corresponding call inside a \code{target} region +is to a \code{fib} function that can execute on the default target device. + +A version of the function is also available on the host device. When the \code{if} +clause conditional expression on the \code{target} construct evaluates to \plc{false}, +the \code{target} region (thus \code{fib}) will execute on the host device. + +For C/C++ codes the declaration of the function \code{fib} appears between the \code{declare} +\code{target} and \code{end} \code{declare} \code{target} directives. + +\cexample{declare_target}{1c} + +The Fortran \code{fib} subroutine contains a \code{declare} \code{target} declaration +to indicate to the compiler to create an device executable version of the procedure. +The subroutine name has not been included on the \code{declare} \code{target} +directive and is, therefore, implicitly assumed. + +The program uses the \code{module\_fib} module, which presents an explicit interface to +the compiler with the \code{declare} \code{target} declarations for processing +the \code{fib} call. + +\fexample{declare_target}{1f} + +The next Fortran example shows the use of an external subroutine. Without an explicit +interface (through module use or an interface block) the \code{declare} \code{target} +declarations within a external subroutine are unknown to the main program unit; +therefore, a \code{declare} \code{target} must be provided within the program +scope for the compiler to determine that a target binary should be available. + +\fexample{declare_target}{2f} + +\section{\code{declare} \code{target} Construct for Class Type} + +The following example shows how the \code{declare} \code{target} and \code{end} +\code{declare} \code{target} directives are used to enclose the declaration +of a variable \plc{varY} with a class type \code{typeY}. The member function \code{typeY::foo()} cannot +be accessed on a target device because its declaration did not appear between \code{declare} +\code{target} and \code{end} \code{declare} \code{target} directives. + +\cexample{declare_target}{2c} + +\section{\code{declare} \code{target} and \code{end} \code{declare} \code{target} for Variables} + +The following examples show how the \code{declare} \code{target} and \code{end} +\code{declare} \code{target} directives are used to indicate that global variables +are mapped to the implicit device data environment of each target device. + +In the following example, the declarations of the variables \plc{p}, \plc{v1}, and \plc{v2} appear +between \code{declare} \code{target} and \code{end} \code{declare} \code{target} +directives indicating that the variables are mapped to the implicit device data +environment of each target device. The \code{target} \code{update} directive +is then used to manage the consistency of the variables \plc{p}, \plc{v1}, and \plc{v2} between the +data environment of the encountering host device task and the implicit device data +environment of the default target device. + +\cexample{declare_target}{3c} + +The Fortran version of the above C code uses a different syntax. Fortran modules +use a list syntax on the \code{declare} \code{target} directive to declare +mapped variables. + +\fexample{declare_target}{3f} + +The following example also indicates that the function \code{Pfun()} is available on the +target device, as well as the variable \plc{Q}, which is mapped to the implicit device +data environment of each target device. The \code{target} \code{update} directive +is then used to manage the consistency of the variable \plc{Q} between the data environment +of the encountering host device task and the implicit device data environment of +the default target device. + +In the following example, the function and variable declarations appear between +the \code{declare} \code{target} and \code{end} \code{declare} \code{target} +directives. + +\cexample{declare_target}{4c} + +The Fortran version of the above C code uses a different syntax. In Fortran modules +a list syntax on the \code{declare} \code{target} directive is used to declare +mapped variables and procedures. The \plc{N} and \plc{Q} variables are declared as a comma +separated list. When the \code{declare} \code{target} directive is used to +declare just the procedure, the procedure name need not be listed -- it is implicitly +assumed, as illustrated in the \code{Pfun()} function. + +\fexample{declare_target}{4f} + +\section{\code{declare} \code{target} and \code{end} \code{declare} \code{target} with \code{declare} \code{simd}} + +The following example shows how the \code{declare} \code{target} and \code{end} +\code{declare} \code{target} directives are used to indicate that a function +is available on a target device. The \code{declare} \code{simd} directive indicates +that there is a SIMD version of the function \code{P()} that is available on the target +device as well as one that is available on the host device. + +\cexample{declare_target}{5c} + +The Fortran version of the above C code uses a different syntax. Fortran modules +use a list syntax of the \code{declare} \code{target} declaration for the mapping. +Here the \plc{N} and \plc{Q} variables are declared in the list form as a comma separated list. +The function declaration does not use a list and implicitly assumes the function +name. In this Fortran example row and column indices are reversed relative to the +C/C++ example, as is usual for codes optimized for memory access. + +\fexample{declare_target}{5f} + diff --git a/Examples_default_none.tex b/Examples_default_none.tex new file mode 100644 index 0000000..e745df1 --- /dev/null +++ b/Examples_default_none.tex @@ -0,0 +1,12 @@ +\pagebreak +\chapter{The \code{default(none)} Clause} +\label{chap:default_none} + +The following example distinguishes the variables that are affected by the \code{default(none)} +clause from those that are not. + +\cexample{default_none}{1c} + +\fexample{default_none}{1f} + + diff --git a/Examples_device.tex b/Examples_device.tex new file mode 100644 index 0000000..c09c7f6 --- /dev/null +++ b/Examples_device.tex @@ -0,0 +1,35 @@ +\pagebreak +\chapter{Device Routines} +\label{chap:device} + +\section{\code{omp\_is\_initial\_device} Routine} + +The following example shows how the \code{omp\_is\_initial\_device} runtime library routine +can be used to query if a code is executing on the initial host device or on a +target device. The example then sets the number of threads in the \code{parallel} +region based on where the code is executing. + +\cexample{device}{1c} + +\fexample{device}{1f} + +\section{\code{omp\_get\_num\_devices} Routine} + +The following example shows how the \code{omp\_get\_num\_devices} runtime library routine +can be used to determine the number of devices. + +\cexample{device}{2c} + +\fexample{device}{2f} + +\section{\code{omp\_set\_default\_device} and \\ +\code{omp\_get\_default\_device} Routines} + +The following example shows how the \code{omp\_set\_default\_device} and \code{omp\_get\_default\_device} +runtime library routines can be used to set the default device and determine the +default device respectively. + +\cexample{device}{3c} + +\fexample{device}{3f} + diff --git a/Examples_flush_nolist.tex b/Examples_flush_nolist.tex new file mode 100644 index 0000000..732da9f --- /dev/null +++ b/Examples_flush_nolist.tex @@ -0,0 +1,12 @@ +\pagebreak +\chapter{The \code{flush} Construct without a List} +\label{chap:flush_nolist} + +The following example distinguishes the shared variables affected by a \code{flush} +construct with no list from the shared objects that are not affected: + +\cexample{flush_nolist}{1c} + +\fexample{flush_nolist}{1f} + + diff --git a/Examples_fort_do.tex b/Examples_fort_do.tex new file mode 100644 index 0000000..d0c5fe9 --- /dev/null +++ b/Examples_fort_do.tex @@ -0,0 +1,19 @@ +\pagebreak +\chapter{Fortran Restrictions on the \code{do} Construct} +\label{chap:fort_do} +\fortranspecificstart + +If an \code{end do} directive follows a \plc{do-construct} in which several +\code{DO} statements share a \code{DO} termination statement, then a \code{do} +directive can only be specified for the outermost of these \code{DO} statements. +The following example contains correct usages of loop constructs: + +\fnexample{fort_do}{1f} + +The following example is non-conforming because the matching \code{do} directive +for the \code{end do} does not precede the outermost loop: + +\fnexample{fort_do}{2f} +\fortranspecificend + + diff --git a/Examples_fort_loopvar.tex b/Examples_fort_loopvar.tex new file mode 100644 index 0000000..e32d107 --- /dev/null +++ b/Examples_fort_loopvar.tex @@ -0,0 +1,22 @@ +\pagebreak +\chapter{Fortran Private Loop Iteration Variables} +\label{chap:fort_loopvar} +\fortranspecificstart + +In general loop iteration variables will be private, when used in the \plc{do-loop} +of a \code{do} and \code{parallel do} construct or in sequential loops in a +\code{parallel} construct (see \$ and \$). In the following example of a sequential +loop in a \code{parallel} construct the loop iteration variable \plc{I} will +be private. + +\fnexample{fort_loopvar}{1f} + +In exceptional cases, loop iteration variables can be made shared, as in the following +example: + +\fnexample{fort_loopvar}{2f} + +Note however that the use of shared loop iteration variables can easily lead to +race conditions. +\fortranspecificend + diff --git a/Examples_fort_race.tex b/Examples_fort_race.tex new file mode 100644 index 0000000..25f0a37 --- /dev/null +++ b/Examples_fort_race.tex @@ -0,0 +1,16 @@ +\pagebreak +\chapter{Race Conditions Caused by Implied Copies of Shared Variables in Fortran} +\fortranspecificstart +\label{chap:fort_race} + +The following example contains a race condition, because the shared variable, which +is an array section, is passed as an actual argument to a routine that has an assumed-size +array as its dummy argument. The subroutine call passing an array section argument +may cause the compiler to copy the argument into a temporary location prior to +the call and copy from the temporary location into the original variable when the +subroutine returns. This copying would cause races in the \code{parallel} region. + +\fnexample{fort_race}{1f} +\fortranspecificend + + diff --git a/Examples_fort_sa_private.tex b/Examples_fort_sa_private.tex new file mode 100644 index 0000000..fd50c5b --- /dev/null +++ b/Examples_fort_sa_private.tex @@ -0,0 +1,23 @@ +\pagebreak +\chapter{Fortran Restrictions on Storage Association with the \code{private} Clause} +\fortranspecificstart +\label{chap:fort_sa_private} + +The following non-conforming examples illustrate the implications of the \code{private} +clause rules with regard to storage association. + +\fnexample{fort_sa_private}{1f} + +\fnexample{fort_sa_private}{2f} +% blue line floater at top of this page for "Fortran, cont." +\begin{figure}[t!] +\linewitharrows{-1}{dashed}{Fortran (cont.)}{8em} +\end{figure} + +\fnexample{fort_sa_private}{3f} + +\fnexample{fort_sa_private}{4f} + +\fnexample{fort_sa_private}{5f} +\fortranspecificend + diff --git a/Examples_fort_sp_common.tex b/Examples_fort_sp_common.tex new file mode 100644 index 0000000..d5af05d --- /dev/null +++ b/Examples_fort_sp_common.tex @@ -0,0 +1,38 @@ +\pagebreak +\chapter{Fortran Restrictions on \code{shared} and \code{private} Clauses with Common Blocks} +\fortranspecificstart +\label{chap:fort_sp_common} + +When a named common block is specified in a \code{private}, \code{firstprivate}, +or \code{lastprivate} clause of a construct, none of its members may be declared +in another data-sharing attribute clause on that construct. The following examples +illustrate this point. + +The following example is conforming: + +\fnexample{fort_sp_common}{1f} + +The following example is also conforming: + +\fnexample{fort_sp_common}{2f} +% blue line floater at top of this page for "Fortran, cont." +\begin{figure}[t!] +\linewitharrows{-1}{dashed}{Fortran (cont.)}{8em} +\end{figure} + +The following example is conforming: + +\fnexample{fort_sp_common}{3f} + +The following example is non-conforming because \code{x} is a constituent element +of \code{c}: + +\fnexample{fort_sp_common}{4f} + +The following example is non-conforming because a common block may not be declared +both shared and private: + +\fnexample{fort_sp_common}{5f} +\fortranspecificend + + diff --git a/Examples_fpriv_sections.tex b/Examples_fpriv_sections.tex new file mode 100644 index 0000000..2102263 --- /dev/null +++ b/Examples_fpriv_sections.tex @@ -0,0 +1,18 @@ +\pagebreak +\chapter{The \code{firstprivate} Clause and the \code{sections} Construct} +\label{chap:fpriv_sections} + +In the following example of the \code{sections} construct the \code{firstprivate} +clause is used to initialize the private copy of \code{section\_count} of each +thread. The problem is that the \code{section} constructs modify \code{section\_count}, +which breaks the independence of the \code{section} constructs. When different +threads execute each section, both sections will print the value 1. When the same +thread executes the two sections, one section will print the value 1 and the other +will print the value 2. Since the order of execution of the two sections in this +case is unspecified, it is unspecified which section prints which value. + +\cexample{fpriv_sections}{1c} + +\fexample{fpriv_sections}{1f} + + diff --git a/Examples_get_nthrs.tex b/Examples_get_nthrs.tex new file mode 100644 index 0000000..35d0049 --- /dev/null +++ b/Examples_get_nthrs.tex @@ -0,0 +1,21 @@ +\pagebreak +\chapter{The \code{omp\_get\_num\_threads} Routine} +\label{chap:get_nthrs} + +In the following example, the \code{omp\_get\_num\_threads} call returns 1 in +the sequential part of the code, so \code{np} will always be equal to 1. To determine +the number of threads that will be deployed for the \code{parallel} region, the +call should be inside the \code{parallel} region. + +\cexample{get_nthrs}{1c} + +\fexample{get_nthrs}{1f} + +The following example shows how to rewrite this program without including a query +for the number of threads: + +\cexample{get_nthrs}{2c} + +\fexample{get_nthrs}{2f} + + diff --git a/Examples_icv.tex b/Examples_icv.tex new file mode 100644 index 0000000..c0d858f --- /dev/null +++ b/Examples_icv.tex @@ -0,0 +1,56 @@ +\pagebreak +\chapter{Internal Control Variables (ICVs)} +\label{chap:icv} + +According to \$, an OpenMP implementation must act as if there are ICVs that control +the behavior of the program. This example illustrates two ICVs, \plc{nthreads-var} +and \plc{max-active-levels-var}. The \plc{nthreads-var} ICV controls the +number of threads requested for encountered parallel regions; there is one copy +of this ICV per task. The \plc{max-active-levels-var} ICV controls the maximum +number of nested active parallel regions; there is one copy of this ICV for the +whole program. + +In the following example, the \plc{nest-var}, \plc{max-active-levels-var}, +\plc{dyn-var}, and \plc{nthreads-var} ICVs are modified through calls to +the runtime library routines \code{omp\_set\_nested},\\ \code{omp\_set\_max\_active\_levels},\code{ +omp\_set\_dynamic}, and \code{omp\_set\_num\_threads} respectively. These ICVs +affect the operation of \code{parallel} regions. Each implicit task generated +by a \code{parallel} region has its own copy of the \plc{nest-var, dyn-var}, +and \plc{nthreads-var} ICVs. + +In the following example, the new value of \plc{nthreads-var} applies only to +the implicit tasks that execute the call to \code{omp\_set\_num\_threads}. There +is one copy of the \plc{max-active-levels-var} ICV for the whole program and +its value is the same for all tasks. This example assumes that nested parallelism +is supported. + +The outer \code{parallel} region creates a team of two threads; each of the threads +will execute one of the two implicit tasks generated by the outer \code{parallel} +region. + +Each implicit task generated by the outer \code{parallel} region calls \code{omp\_set\_num\_threads(3)}, +assigning the value 3 to its respective copy of \plc{nthreads-var}. Then each +implicit task encounters an inner \code{parallel} region that creates a team +of three threads; each of the threads will execute one of the three implicit tasks +generated by that inner \code{parallel} region. + +Since the outer \code{parallel} region is executed by 2 threads, and the inner +by 3, there will be a total of 6 implicit tasks generated by the two inner \code{parallel} +regions. + +Each implicit task generated by an inner \code{parallel} region will execute +the call to\\ \code{omp\_set\_num\_threads(4)}, assigning the value 4 to its respective +copy of \plc{nthreads-var}. + +The print statement in the outer \code{parallel} region is executed by only one +of the threads in the team. So it will be executed only once. + +The print statement in an inner \code{parallel} region is also executed by only +one of the threads in the team. Since we have a total of two inner \code{parallel} +regions, the print statement will be executed twice -- once per inner \code{parallel} +region. + +\cexample{icv}{1c} + +\fexample{icv}{1f} + diff --git a/Examples_init_lock.tex b/Examples_init_lock.tex new file mode 100644 index 0000000..b686992 --- /dev/null +++ b/Examples_init_lock.tex @@ -0,0 +1,11 @@ +\pagebreak +\chapter{The \code{omp\_init\_lock} Routine} +\label{chap:init_lock} + +The following example demonstrates how to initialize an array of locks in a \code{parallel} +region by using \code{omp\_init\_lock}. + +\cexample{init_lock}{1c} + +\fexample{init_lock}{1f} + diff --git a/Examples_lastprivate.tex b/Examples_lastprivate.tex new file mode 100644 index 0000000..b019fe1 --- /dev/null +++ b/Examples_lastprivate.tex @@ -0,0 +1,14 @@ +\pagebreak +\chapter{The \code{lastprivate} Clause} +\label{chap:lastprivate} + +Correct execution sometimes depends on the value that the last iteration of a loop +assigns to a variable. Such programs must list all such variables in a \code{lastprivate} +clause so that the values of the variables are the same as when the loop is executed +sequentially. + +\cexample{lastprivate}{1c} + +\fexample{lastprivate}{1f} + + diff --git a/Examples_lock_owner.tex b/Examples_lock_owner.tex new file mode 100644 index 0000000..0a6dab4 --- /dev/null +++ b/Examples_lock_owner.tex @@ -0,0 +1,23 @@ +\pagebreak +\chapter{Ownership of Locks} +\label{chap:lock_owner} + +Ownership of locks has changed since OpenMP 2.5. In OpenMP 2.5, locks are owned +by threads; so a lock released by the \code{omp\_unset\_lock} routine must be +owned by the same thread executing the routine. With OpenMP 3.0, locks are owned +by task regions; so a lock released by the \code{omp\_unset\_lock} routine in +a task region must be owned by the same task region. + +This change in ownership requires extra care when using locks. The following program +is conforming in OpenMP 2.5 because the thread that releases the lock \code{lck} +in the parallel region is the same thread that acquired the lock in the sequential +part of the program (master thread of parallel region and the initial thread are +the same). However, it is not conforming in OpenMP 3.0 and 3.1, because the task +region that releases the lock \code{lck} is different from the task region that +acquires the lock. + +\cexample{lock_owner}{1c} + +\fexample{lock_owner}{1f} + + diff --git a/Examples_master.tex b/Examples_master.tex new file mode 100644 index 0000000..48de993 --- /dev/null +++ b/Examples_master.tex @@ -0,0 +1,13 @@ +\pagebreak +\chapter{The \code{master} Construct} +\label{chap:master} + +The following example demonstrates the master construct . In the example, the master +keeps track of how many iterations have been executed and prints out a progress +report. The other threads skip the master region without waiting. + +\cexample{master}{1c} + +\fexample{master}{1f} + + diff --git a/Examples_mem_model.tex b/Examples_mem_model.tex new file mode 100644 index 0000000..a7625dd --- /dev/null +++ b/Examples_mem_model.tex @@ -0,0 +1,38 @@ +\pagebreak +\chapter{The OpenMP Memory Model} +\label{chap:mem_model} + +In the following example, at Print 1, the value of \plc{x} could be either 2 +or 5, depending on the timing of the threads, and the implementation of the assignment +to \plc{x}. There are two reasons that the value at Print 1 might not be 5. +First, Print 1 might be executed before the assignment to \plc{x} is executed. +Second, even if Print 1 is executed after the assignment, the value 5 is not guaranteed +to be seen by thread 1 because a flush may not have been executed by thread 0 since +the assignment. + +The barrier after Print 1 contains implicit flushes on all threads, as well as +a thread synchronization, so the programmer is guaranteed that the value 5 will +be printed by both Print 2 and Print 3. + +\cexample{mem_model}{1c} + +\fexample{mem_model}{1f} + +The following example demonstrates why synchronization is difficult to perform +correctly through variables. The value of flag is undefined in both prints on thread +1 and the value of data is only well-defined in the second print. + +\cexample{mem_model}{2c} + +\fexample{mem_model}{2f} + +The next example demonstrates why synchronization is difficult to perform correctly +through variables. Because the \plc{write}(1)-\plc{flush}(1)-\plc{flush}(2)-\plc{read}(2) +sequence cannot be guaranteed in the example, the statements on thread 0 and thread +1 may execute in either order. + +\cexample{mem_model}{3c} + +\fexample{mem_model}{3f} + + diff --git a/Examples_nestable_lock.tex b/Examples_nestable_lock.tex new file mode 100644 index 0000000..89b55e7 --- /dev/null +++ b/Examples_nestable_lock.tex @@ -0,0 +1,11 @@ +\pagebreak +\chapter{Nestable Lock Routines} +\label{chap:nestable_lock} + +The following example demonstrates how a nestable lock can be used to synchronize +updates both to a whole structure and to one of its members. + +\cexample{nestable_lock}{1c} + +\fexample{nestable_lock}{1f} + diff --git a/Examples_nested_loop.tex b/Examples_nested_loop.tex new file mode 100644 index 0000000..fad0077 --- /dev/null +++ b/Examples_nested_loop.tex @@ -0,0 +1,18 @@ +\pagebreak +\chapter{Nested Loop Constructs} +\label{chap:nested_loop} + +The following example of loop construct nesting is conforming because the inner +and outer loop regions bind to different \code{parallel} regions: + +\cexample{nested_loop}{1c} + +\fexample{nested_loop}{1f} + +The following variation of the preceding example is also conforming: + +\cexample{nested_loop}{2c} + +\fexample{nested_loop}{2f} + + diff --git a/Examples_nesting_restrict.tex b/Examples_nesting_restrict.tex new file mode 100644 index 0000000..0eecdea --- /dev/null +++ b/Examples_nesting_restrict.tex @@ -0,0 +1,52 @@ +\pagebreak +\chapter{Restrictions on Nesting of Regions} +\label{chap:nesting_restrict} + +The examples in this section illustrate the region nesting rules. + +The following example is non-conforming because the inner and outer loop regions +are closely nested: + +\cexample{nesting_restrict}{1c} + +\fexample{nesting_restrict}{1f} + +The following orphaned version of the preceding example is also non-conforming: + +\cexample{nesting_restrict}{2c} + +\fexample{nesting_restrict}{2f} + +The following example is non-conforming because the loop and \code{single} regions +are closely nested: + +\cexample{nesting_restrict}{3c} + +\fexample{nesting_restrict}{3f} + +The following example is non-conforming because a \code{barrier} region cannot +be closely nested inside a loop region: + +\cexample{nesting_restrict}{4c} + +\fexample{nesting_restrict}{4f} + +The following example is non-conforming because the \code{barrier} region cannot +be closely nested inside the \code{critical} region. If this were permitted, +it would result in deadlock due to the fact that only one thread at a time can +enter the \code{critical} region: + +\cexample{nesting_restrict}{5c} + +\fexample{nesting_restrict}{5f} + +The following example is non-conforming because the \code{barrier} region cannot +be closely nested inside the \code{single} region. If this were permitted, it +would result in deadlock due to the fact that only one thread executes the \code{single} +region: + +\cexample{nesting_restrict}{6c} + +\fexample{nesting_restrict}{6f} + + diff --git a/Examples_nowait.tex b/Examples_nowait.tex new file mode 100644 index 0000000..ebdcffd --- /dev/null +++ b/Examples_nowait.tex @@ -0,0 +1,28 @@ +\pagebreak +\chapter{The \code{nowait} Clause} +\label{chap:nowait} + +If there are multiple independent loops within a \code{parallel} region, you +can use the \code{nowait} clause to avoid the implied barrier at the end of the +loop construct, as follows: + +\cexample{nowait}{1c} + +\fexample{nowait}{1f} + +In the following example, static scheduling distributes the same logical iteration +numbers to the threads that execute the three loop regions. This allows the \code{nowait} +clause to be used, even though there is a data dependence between the loops. The +dependence is satisfied as long the same thread executes the same logical iteration +numbers in each loop. + +Note that the iteration count of the loops must be the same. The example satisfies +this requirement, since the iteration space of the first two loops is from \code{0} +to \code{n-1} (from \code{1} to \code{N} in the Fortran version), while the +iteration space of the last loop is from \code{1} to \code{n} (\code{2} to +\code{N+1} in the Fortran version). + +\cexample{nowait}{2c} + +\fexample{nowait}{2f} + diff --git a/Examples_nthrs_dynamic.tex b/Examples_nthrs_dynamic.tex new file mode 100644 index 0000000..961a2f3 --- /dev/null +++ b/Examples_nthrs_dynamic.tex @@ -0,0 +1,30 @@ +\pagebreak +\chapter{Interaction Between the \code{num\_threads} Clause and \code{omp\_set\_dynamic}} +\label{chap:nthrs_dynamic} + +The following example demonstrates the \code{num\_threads} clause and the effect +of the \\ +\code{omp\_set\_dynamic} routine on it. + +The call to the \code{omp\_set\_dynamic} routine with argument \code{0} in +C/C++, or \code{.FALSE.} in Fortran, disables the dynamic adjustment of the number +of threads in OpenMP implementations that support it. In this case, 10 threads +are provided. Note that in case of an error the OpenMP implementation is free to +abort the program or to supply any number of threads available. + +\cexample{nthrs_dynamic}{1c} + +\fexample{nthrs_dynamic}{1f} + +The call to the \code{omp\_set\_dynamic} routine with a non-zero argument in +C/C++, or \code{.TRUE.} in Fortran, allows the OpenMP implementation to choose +any number of threads between 1 and 10. + +\cexample{nthrs_dynamic}{2c} + +\fexample{nthrs_dynamic}{2f} + +It is good practice to set the \plc{dyn-var} ICV explicitly by calling the \code{omp\_set\_dynamic} +routine, as its default setting is implementation defined. + + diff --git a/Examples_nthrs_nesting.tex b/Examples_nthrs_nesting.tex new file mode 100644 index 0000000..c5a0334 --- /dev/null +++ b/Examples_nthrs_nesting.tex @@ -0,0 +1,12 @@ +\pagebreak +\chapter{Controlling the Number of Threads on Multiple Nesting Levels} +\label{chap:nthrs_nesting} + +The following examples demonstrate how to use the \code{OMP\_NUM\_THREADS} environment +variable to control the number of threads on multiple nesting levels: + +\cexample{nthrs_nesting}{1c} + +\fexample{nthrs_nesting}{1f} + + diff --git a/Examples_ordered.tex b/Examples_ordered.tex new file mode 100644 index 0000000..d757cfb --- /dev/null +++ b/Examples_ordered.tex @@ -0,0 +1,28 @@ +\pagebreak +\chapter{The \code{ordered} Clause and the \code{ordered} Construct} +\label{chap:ordered} + +Ordered constructs are useful for sequentially ordering the output from work that +is done in parallel. The following program prints out the indices in sequential +order: + +\cexample{ordered}{1c} + +\fexample{ordered}{1f} + +It is possible to have multiple \code{ordered} constructs within a loop region +with the \code{ordered} clause specified. The first example is non-conforming +because all iterations execute two \code{ordered} regions. An iteration of a +loop must not execute more than one \code{ordered} region: + +\cexample{ordered}{2c} + +\fexample{ordered}{2f} + +The following is a conforming example with more than one \code{ordered} construct. +Each iteration will execute only one \code{ordered} region: + +\cexample{ordered}{3c} + +\fexample{ordered}{3f} + diff --git a/Examples_parallel.tex b/Examples_parallel.tex new file mode 100644 index 0000000..06b56db --- /dev/null +++ b/Examples_parallel.tex @@ -0,0 +1,12 @@ +\pagebreak +\chapter{The \code{parallel} Construct} +\label{chap:parallel} + +The \code{parallel} construct can be used in coarse-grain parallel programs. +In the following example, each thread in the \code{parallel} region decides what +part of the global array \plc{x} to work on, based on the thread number: + +\cexample{parallel}{1c} + +\fexample{parallel}{1f} + diff --git a/Examples_ploop.tex b/Examples_ploop.tex new file mode 100644 index 0000000..40e113c --- /dev/null +++ b/Examples_ploop.tex @@ -0,0 +1,11 @@ +\chapter{A Simple Parallel Loop} +\label{chap:ploop} + +The following example demonstrates how to parallelize a simple loop using the parallel +loop construct. The loop iteration variable is private by default, so it is not +necessary to specify it explicitly in a \code{private} clause. + +\cexample{ploop}{1c} + +\fexample{ploop}{1f} + diff --git a/Examples_pra_iterator.tex b/Examples_pra_iterator.tex new file mode 100644 index 0000000..390971a --- /dev/null +++ b/Examples_pra_iterator.tex @@ -0,0 +1,11 @@ +\pagebreak +\chapter{Parallel Random Access Iterator Loop} +\ccppspecificstart +\label{chap:pra_iterator} + +The following example shows a parallel random access iterator loop. + +\cnexample{pra_iterator}{1c} +\ccppspecificend + + diff --git a/Examples_private.tex b/Examples_private.tex new file mode 100644 index 0000000..d25d7fc --- /dev/null +++ b/Examples_private.tex @@ -0,0 +1,31 @@ +\pagebreak +\chapter{The \code{private} Clause} +\label{chap:private} + +In the following example, the values of original list items \plc{i} and \plc{j} +are retained on exit from the \code{parallel} region, while the private list +items \plc{i} and \plc{j} are modified within the \code{parallel} construct. + +\cexample{private}{1c} + +\fexample{private}{1f} + +In the following example, all uses of the variable \plc{a} within the loop construct +in the routine \plc{f} refer to a private list item \plc{a}, while it is +unspecified whether references to \plc{a} in the routine \plc{g} are to a +private list item or the original list item. + +\cexample{private}{2c} + +\fexample{private}{2f} + +The following example demonstrates that a list item that appears in a \code{private} + clause in a \code{parallel} construct may also appear in a \code{private} + clause in an enclosed worksharing construct, which results in an additional private +copy. + +\cexample{private}{3c} + +\fexample{private}{3f} + + diff --git a/Examples_psections.tex b/Examples_psections.tex new file mode 100644 index 0000000..3f96e18 --- /dev/null +++ b/Examples_psections.tex @@ -0,0 +1,13 @@ +\pagebreak +\chapter{The \code{parallel} \code{sections} Construct} +\label{chap:psections} + +In the following example routines \code{XAXIS}, \code{YAXIS}, and \code{ZAXIS} can +be executed concurrently. The first \code{section} directive is optional. Note +that all \code{section} directives need to appear in the \code{parallel sections} +construct. + +\cexample{psections}{1c} + +\fexample{psections}{1f} + diff --git a/Examples_reduction.tex b/Examples_reduction.tex new file mode 100644 index 0000000..ae582f7 --- /dev/null +++ b/Examples_reduction.tex @@ -0,0 +1,60 @@ +\pagebreak +\chapter{The \code{reduction} Clause} +\label{chap:reduction} + +The following example demonstrates the \code{reduction} clause ; note that some +reductions can be expressed in the loop in several ways, as shown for the \code{max} +and \code{min} reductions below: + +\cexample{reduction}{1c} + +\fexample{reduction}{1f} + +A common implementation of the preceding example is to treat it as if it had been +written as follows: + +\cexample{reduction}{2c} + +\fortranspecificstart +\fnexample{reduction}{2f} + +The following program is non-conforming because the reduction is on the +\emph{intrinsic procedure name} \code{MAX} but that name has been redefined to be the variable +named \code{MAX}. +% blue line floater at top of this page for "Fortran, cont." +\begin{figure}[t!] +\linewitharrows{-1}{dashed}{Fortran (cont.)}{8em} +\end{figure} + +\fnexample{reduction}{3f} + +The following conforming program performs the reduction using the +\emph{intrinsic procedure name} \code{MAX} even though the intrinsic \code{MAX} has been renamed +to \code{REN}. + +\fnexample{reduction}{4f} + +The following conforming program performs the reduction using +\plc{intrinsic procedure name} \code{MAX} even though the intrinsic \code{MAX} has been renamed +to \code{MIN}. + +\fnexample{reduction}{5f} +\fortranspecificend + +The following example is non-conforming because the initialization (\code{a = +0}) of the original list item \code{a} is not synchronized with the update of +\code{a} as a result of the reduction computation in the \code{for} loop. Therefore, +the example may print an incorrect value for \code{a}. + +To avoid this problem, the initialization of the original list item \code{a} +should complete before any update of \code{a} as a result of the \code{reduction} +clause. This can be achieved by adding an explicit barrier after the assignment +\code{a = 0}, or by enclosing the assignment \code{a = 0} in a \code{single} +directive (which has an implied barrier), or by initializing \code{a} before +the start of the \code{parallel} region. + +\cexample{reduction}{3c} + +\fexample{reduction}{6f} + + diff --git a/Examples_set_dynamic_nthrs.tex b/Examples_set_dynamic_nthrs.tex new file mode 100644 index 0000000..5938e39 --- /dev/null +++ b/Examples_set_dynamic_nthrs.tex @@ -0,0 +1,24 @@ +\pagebreak +\chapter{The \code{omp\_set\_dynamic} and \\ +\code{omp\_set\_num\_threads} Routines} +\label{chap:set_dynamic_nthrs} + +Some programs rely on a fixed, prespecified number of threads to execute correctly. +Because the default setting for the dynamic adjustment of the number of threads +is implementation defined, such programs can choose to turn off the dynamic threads +capability and set the number of threads explicitly to ensure portability. The +following example shows how to do this using \code{omp\_set\_dynamic}, and \code{omp\_set\_num\_threads}. + +In this example, the program executes correctly only if it is executed by 16 threads. +If the implementation is not capable of supporting 16 threads, the behavior of +this example is implementation defined. Note that the number of threads executing +a \code{parallel} region remains constant during the region, regardless of the +dynamic threads setting. The dynamic threads mechanism determines the number of +threads to use at the start of the \code{parallel} region and keeps it constant +for the duration of the region. + +\cexample{set_dynamic_nthrs}{1c} + +\fexample{set_dynamic_nthrs}{1f} + + diff --git a/Examples_simple_lock.tex b/Examples_simple_lock.tex new file mode 100644 index 0000000..da9b8ca --- /dev/null +++ b/Examples_simple_lock.tex @@ -0,0 +1,19 @@ +\pagebreak +\chapter{Simple Lock Routines} +\label{chap:simple_lock} + +In the following example, the lock routines cause the threads to be idle while +waiting for entry to the first critical section, but to do other work while waiting +for entry to the second. The \code{omp\_set\_lock} function blocks, but the \code{omp\_test\_lock} +function does not, allowing the work in \code{skip} to be done. + +Note that the argument to the lock routines should have type \code{omp\_lock\_t}, +and that there is no need to flush it. + +\cexample{simple_lock}{1c} + +Note that there is no need to flush the lock variable. + +\fexample{simple_lock}{1f} + + diff --git a/Examples_single.tex b/Examples_single.tex new file mode 100644 index 0000000..b2502f8 --- /dev/null +++ b/Examples_single.tex @@ -0,0 +1,18 @@ +\pagebreak +\chapter{The \code{single} Construct} +\label{chap:single} + +The following example demonstrates the \code{single} construct. In the example, +only one thread prints each of the progress messages. All other threads will skip +the \code{single} region and stop at the barrier at the end of the \code{single} +construct until all threads in the team have reached the barrier. If other threads +can proceed without waiting for the thread executing the \code{single} region, +a \code{nowait} clause can be specified, as is done in the third \code{single} +construct in this example. The user must not make any assumptions as to which thread +will execute a \code{single} region. + +\cexample{single}{1c} + +\fexample{single}{1f} + + diff --git a/Examples_standalone.tex b/Examples_standalone.tex new file mode 100644 index 0000000..acdd208 --- /dev/null +++ b/Examples_standalone.tex @@ -0,0 +1,31 @@ +\pagebreak +\chapter{Placement of \code{flush}, \code{barrier}, \code{taskwait} +and \code{taskyield} Directives} +\label{chap:standalone} + +The following example is non-conforming, because the \code{flush}, \code{barrier}, +\code{taskwait}, and \code{taskyield} directives are stand-alone directives +and cannot be the immediate substatement of an \code{if} statement. + +\cexample{standalone}{1c} + +The following example is non-conforming, because the \code{flush}, \code{barrier}, +\code{taskwait}, and \code{taskyield} directives are stand-alone directives +and cannot be the action statement of an \code{if} statement or a labeled branch +target. + +\fexample{standalone}{1f} + +The following version of the above example is conforming because the \code{flush}, +\code{barrier}, \code{taskwait}, and \code{taskyield} directives are enclosed +in a compound statement. + +\cexample{standalone}{2c} + +The following example is conforming because the \code{flush}, \code{barrier}, +\code{taskwait}, and \code{taskyield} directives are enclosed in an \code{if} +construct or follow the labeled branch target. + +\fexample{standalone}{2f} + + diff --git a/Examples_target.tex b/Examples_target.tex new file mode 100644 index 0000000..de906ec --- /dev/null +++ b/Examples_target.tex @@ -0,0 +1,96 @@ +\pagebreak +\chapter{\code{target} Construct} +\label{chap:target} + +\section{\code{target} Construct on \code{parallel} Construct} + +This following example shows how the \code{target} construct offloads a code +region to a target device. The variables \plc{p}, \plc{v1}, \plc{v2}, and \plc{N} are implicitly mapped +to the the target device. + +\cexample{target}{1c} + +\fexample{target}{1f} + +\section{\code{target} Construct with \code{map} Clause} + +This following example shows how the \code{target} construct offloads a code +region to a target device. The variables \plc{p}, \plc{v1} and \plc{v2} are explicitly mapped to the +the target device using the map clause. The variable \plc{N} is implicitly mapped to +the target device. + +\cexample{target}{2c} + +\fexample{target}{2f} + +\section{\code{map} Clause with \code{to}/\code{from} map-types} + +The following example shows how the \code{target} construct offloads a code region +to a target device. In the \code{map} clause, the \code{to} and \code{from} +map-types define the mapping between the original (host) data and the target (device) +data. The \code{to} map-type specifies that the data will only be read on the +device, and the \code{from} map-type specifies that the data will only be written +to on the device. By specifying a guaranteed access on the device, data transfers +can be reduced for the \code{target} region. + +The \code{to} map-type indicates that at the start of the \code{target} region +the variables \plc{v1} and \plc{v2} are initialized with the values of the corresponding variables +on the host device, and at the end of the \code{target} region the variables +\plc{v1} and \plc{v2} are not assigned to their corresponding variables on the host device. + +The \code{from} map-type indicates that at the start of the \code{target} region +the variable \plc{p} is not initialized with the value of the corresponding variable +on the host device, and at the end of the \code{target} region the variable \plc{p} +is assigned to the corresponding variable on the host device. + +\cexample{target}{3c} + +The \code{to} and \code{from} map-types allow programmers to optimize data +motion. Since data for the \plc{v} arrays are not returned, and data for the \plc{p} array +are not transferred to the device, only one-half of the data is moved, compared +to the default behavior of an implicit mapping. + +\fexample{target}{3f} + +\section{\code{map} Clause with Array Sections} + +The following example shows how the \code{target} construct offloads a code region +to a target device. In the \code{map} clause, map-types are used to optimize +the mapping of variables to the target device. Because variables \plc{p}, \plc{v1} and \plc{v2} are +pointers, array section notation must be used to map the arrays. The notation \code{:N} +is equivalent to \code{0:N}. + +\cexample{target}{4c} + +In C, the length of the pointed-to array must be specified. In Fortran the extent +of the array is known and the length need not be specified. A section of the array +can be specified with the usual Fortran syntax, as shown in the following example. +The value 1 is assumed for the lower bound for array section \plc{v2(:N)}. + +\fexample{target}{4f} + +A more realistic situation in which an assumed-size array is passed to \code{vec\_mult} +requires that the length of the arrays be specified, because the compiler does +not know the size of the storage. A section of the array must be specified with +the usual Fortran syntax, as shown in the following example. The value 1 is assumed +for the lower bound for array section \plc{v2(:N)}. + +\fexample{target}{4bf} + +\section{\code{target} Construct with \code{if} Clause} + +The following example shows how the \code{target} construct offloads a code region +to a target device. + +The \code{if} clause on the \code{target} construct indicates that if the variable +\plc{N} is smaller than a given threshold, then the \code{target} region will be executed +by the host device. + +The \code{if} clause on the \code{parallel} construct indicates that if the +variable \plc{N} is smaller than a second threshold then the \code{parallel} region +is inactive. + +\cexample{target}{5c} + +\fexample{target}{5f} + diff --git a/Examples_target_data.tex b/Examples_target_data.tex new file mode 100644 index 0000000..5626523 --- /dev/null +++ b/Examples_target_data.tex @@ -0,0 +1,175 @@ +\pagebreak +\chapter{\code{target} \code{data} Construct} +\label{chap:target_data} + +\section{Simple \code{target} \code{data} Construct} + +This example shows how the \code{target} \code{data} construct maps variables +to a device data environment. The \code{target} \code{data} construct creates +a new device data environment and maps the variables \plc{v1}, \plc{v2}, and \plc{p} to the new device +data environment. The \code{target} construct enclosed in the \code{target} +\code{data} region creates a new device data environment, which inherits the +variables \plc{v1}, \plc{v2}, and \plc{p} from the enclosing device data environment. The variable +\plc{N} is mapped into the new device data environment from the encountering task's data +environment. + +\cexample{target_data}{1c} + +The Fortran code passes a reference and specifies the extent of the arrays in the +declaration. No length information is necessary in the map clause, as is required +with C/C++ pointers. + +\fexample{target_data}{1f} + +\section{\code{target} \code{data} Region Enclosing Multiple \code{target} Regions} + +The following examples show how the \code{target} \code{data} construct maps +variables to a device data environment of a \code{target} region. The \code{target} +\code{data} construct creates a device data environment and encloses \code{target} +regions, which have their own device data environments. The device data environment +of the \code{target} \code{data} region is inherited by the device data environment +of an enclosed \code{target} region. The \code{target} \code{data} construct +is used to create variables that will persist throughout the \code{target} \code{data} +region. + +In the following example the variables \plc{v1} and \plc{v2} are mapped at each \code{target} +construct. Instead of mapping the variable \plc{p} twice, once at each \code{target} +construct, \plc{p} is mapped once by the \code{target} \code{data} construct. + +\cexample{target_data}{2c} + + +The Fortran code uses reference and specifies the extent of the \plc{p}, \plc{v1} and \plc{v2} arrays. +No length information is necessary in the \code{map} clause, as is required with +C/C++ pointers. The arrays \plc{v1} and \plc{v2} are mapped at each \code{target} construct. +Instead of mapping the array \plc{p} twice, once at each target construct, \plc{p} is mapped +once by the \code{target} \code{data} construct. + +\fexample{target_data}{2f} + +In the following example, the variable tmp defaults to \code{tofrom} map-type +and is mapped at each \code{target} construct. The array \plc{Q} is mapped once at +the enclosing \code{target} \code{data} region instead of at each \code{target} +construct. + +\cexample{target_data}{3c} + +In the following example the arrays \plc{v1} and \plc{v2} are mapped at each \code{target} +construct. Instead of mapping the array \plc{Q} twice at each \code{target} construct, +\plc{Q} is mapped once by the \code{target} \code{data} construct. Note, the \plc{tmp} +variable is implicitly remapped for each \code{target} region, mapping the value +from the device to the host at the end of the first \code{target} region, and +from the host to the device for the second \code{target} region. + +\fexample{target_data}{3f} + +\section{\code{target} \code{data} Construct with Orphaned Call} + +The following two examples show how the \code{target} \code{data} construct +maps variables to a device data environment. The \code{target} \code{data} +construct's device data environment encloses the \code{target} construct's device +data environment in the function \code{vec\_mult()}. + +When the type of the variable appearing in an array section is pointer, the pointer +variable and the storage location of the corresponding array section are mapped +to the device data environment. The pointer variable is treated as if it had appeared +in a \code{map} clause with a map-type of \code{alloc}. The array section's +storage location is mapped according to the map-type in the \code{map} clause +(the default map-type is \code{tofrom}). + +The \code{target} construct's device data environment inherits the storage locations +of the array sections \plc{v1[0:N]}, \plc{v2[:n]}, and \plc{p0[0:N]} from the enclosing target data +construct's device data environment. Neither initialization nor assignment is performed +for the array sections in the new device data environment. + +The pointer variables \plc{p1}, \plc{v3}, and \plc{v4} are mapped into the target construct's device +data environment with an implicit map-type of alloc and they are assigned the address +of the storage location associated with their corresponding array sections. Note +that the following pairs of array section storage locations are equivalent (\plc{p0[:N]}, +\plc{p1[:N]}), (\plc{v1[:N]},\plc{v3[:N]}), and (\plc{v2[:N]},\plc{v4[:N]}). + +\cexample{target_data}{4c} + +The Fortran code maps the pointers and storage in an identical manner (same extent, +but uses indices from 1 to \plc{N}). + +The \code{target} construct's device data environment inherits the storage locations +of the arrays \plc{v1}, \plc{v2} and \plc{p0} from the enclosing \code{target} \code{data} constructs's +device data environment. However, in Fortran the associated data of the pointer +is known, and the shape is not required. + +The pointer variables \plc{p1}, \plc{v3}, and \plc{v4} are mapped into the \code{target} construct's +device data environment with an implicit map-type of \code{alloc} and they are +assigned the address of the storage location associated with their corresponding +array sections. Note that the following pair of array storage locations are equivalent +(\plc{p0},\plc{p1}), (\plc{v1},\plc{v3}), and (\plc{v2},\plc{v4}). + +\fexample{target_data}{4f} + + +In the following example, the variables \plc{p1}, \plc{v3}, and \plc{v4} are references to the pointer +variables \plc{p0}, \plc{v1} and \plc{v2} respectively. The \code{target} construct's device data +environment inherits the pointer variables \plc{p0}, \plc{v1}, and \plc{v2} from the enclosing \code{target} +\code{data} construct's device data environment. Thus, \plc{p1}, \plc{v3}, and \plc{v4} are already +present in the device data environment. + +\cexample{target_data}{5c} + +In the following example, the usual Fortran approach is used for dynamic memory. +The \plc{p0}, \plc{v1}, and \plc{v2} arrays are allocated in the main program and passed as references +from one routine to another. In \code{vec\_mult}, \plc{p1}, \plc{v3} and \plc{v4} are references to the +\plc{p0}, \plc{v1}, and \plc{v2} arrays, respectively. The \code{target} construct's device data +environment inherits the arrays \plc{p0}, \plc{v1}, and \plc{v2} from the enclosing target data construct's +device data environment. Thus, \plc{p1}, \plc{v3}, and \plc{v4} are already present in the device +data environment. + +\fexample{target_data}{5f} + +\section{\code{target} \code{data} Construct with \code{if} Clause} + +The following two examples show how the \code{target} \code{data} construct +maps variables to a device data environment. + +In the following example, the if clause on the \code{target} \code{data} construct +indicates that if the variable \plc{N} is smaller than a given threshold, then the \code{target} +\code{data} construct will not create a device data environment. + +The \code{target} constructs enclosed in the \code{target} \code{data} region +must also use an \code{if} clause on the same condition, otherwise the pointer +variable \plc{p} is implicitly mapped with a map-type of \code{tofrom}, but the storage +location for the array section \plc{p[0:N]} will not be mapped in the device data environments +of the \code{target} constructs. + +\cexample{target_data}{6c} + +The \code{if} clauses work the same way for the following Fortran code. The \code{target} +constructs enclosed in the \code{target} \code{data} region should also use +an \code{if} clause with the same condition, so that the \code{target} \code{data} +region and the \code{target} region are either both created for the device, or +are both ignored. + +\fexample{target_data}{6f} + +In the following example, when the \code{if} clause conditional expression on +the \code{target} construct evaluates to \plc{false}, the target region will +execute on the host device. However, the \code{target} \code{data} construct +created an enclosing device data environment that mapped \plc{p[0:N]} to a device data +environment on the default device. At the end of the \code{target} \code{data} +region the array section \plc{p[0:N]} will be assigned from the device data environment +to the corresponding variable in the data environment of the task that encountered +the \code{target} \code{data} construct, resulting in undefined values in \plc{p[0:N]}. + +\cexample{target_data}{7c} + +The \code{if} clauses work the same way for the following Fortran code. When +the \code{if} clause conditional expression on the \code{target} construct +evaluates to \plc{false}, the \code{target} region will execute on the host +device. However, the \code{target} \code{data} construct created an enclosing +device data environment that mapped the \plc{p} array (and \plc{v1} and \plc{v2}) to a device data +environment on the default target device. At the end of the \code{target} \code{data} +region the \plc{p} array will be assigned from the device data environment to the corresponding +variable in the data environment of the task that encountered the \code{target} +\code{data} construct, resulting in undefined values in \plc{p}. + +\fexample{target_data}{7f} + diff --git a/Examples_target_update.tex b/Examples_target_update.tex new file mode 100644 index 0000000..a945d82 --- /dev/null +++ b/Examples_target_update.tex @@ -0,0 +1,53 @@ +\pagebreak +\chapter{\code{target} \code{update} Construct} +\label{chap:target_update} + +\section{Simple \code{target} \code{data} and \code{target} \code{update} Constructs} + +The following example shows how the \code{target} \code{update} construct updates +variables in a device data environment. + +The \code{target} \code{data} construct maps array sections \plc{v1[:N]} and \plc{v2[:N]} +(arrays \plc{v1} and \plc{v2} in the Fortran code) into a device data environment. + +The task executing on the host device encounters the first \code{target} region +and waits for the completion of the region. + +After the execution of the first \code{target} region, the task executing on +the host device then assigns new values to \plc{v1[:N]} and \plc{v2[:N]} (\plc{v1} and \plc{v2} arrays +in Fortran code) in the task's data environment by calling the function \code{init\_again()}. + +The \code{target} \code{update} construct assigns the new values of \plc{v1} and +\plc{v2} from the task's data environment to the corresponding mapped array sections +in the device data environment of the \code{target} \code{data} construct. + +The task executing on the host device then encounters the second \code{target} +region and waits for the completion of the region. + +The second \code{target} region uses the updated values of \plc{v1[:N]} and \plc{v2[:N]}. + +\cexample{target_update}{1c} + +\fexample{target_update}{1f} + +\section{\code{target} \code{update} Construct with \code{if} Clause} + +The following example shows how the \code{target} \code{update} construct updates +variables in a device data environment. + +The \code{target} \code{data} construct maps array sections \plc{v1[:N]} and \plc{v2[:N]} +(arrays \plc{v1} and \plc{v2} in the Fortran code) into a device data environment. In between +the two \code{target} regions, the task executing on the host device conditionally +assigns new values to \plc{v1} and \plc{v2} in the task's data environment. The function \code{maybe\_init\_again()} +returns \plc{true} if new data is written. + +When the conditional expression (the return value of \code{maybe\_init\_again()}) in the +\code{if} clause is \plc{true}, the \code{target} \code{update} construct +assigns the new values of \plc{v1} and \plc{v2} from the task's data environment to the corresponding +mapped array sections in the \code{target} \code{data} construct's device data +environment. + +\cexample{target_update}{2c} + +\fexample{target_update}{2f} + diff --git a/Examples_taskgroup.tex b/Examples_taskgroup.tex new file mode 100644 index 0000000..7913bfb --- /dev/null +++ b/Examples_taskgroup.tex @@ -0,0 +1,20 @@ +\pagebreak +\chapter{The \code{taskgroup} Construct} +\label{chap:taskgroup} + +In this example, tasks are grouped and synchronized using the \code{taskgroup} +construct. + +Initially, one task (the task executing the \code{start\_background\_work()} +call) is created in the \code{parallel} region, and later a parallel tree traversal +is started (the task executing the root of the recursive \code{compute\_tree()} +calls). While synchronizing tasks at the end of each tree traversal, using the +\code{taskgroup} construct ensures that the formerly started background task +does not participate in the synchronization, and is left free to execute in parallel. +This is opposed to the behaviour of the \code{taskwait} construct, which would +include the background tasks in the synchronization. + +\cexample{taskgroup}{1c} + +\fexample{taskgroup}{1f} + diff --git a/Examples_tasking.tex b/Examples_tasking.tex new file mode 100644 index 0000000..f112319 --- /dev/null +++ b/Examples_tasking.tex @@ -0,0 +1,258 @@ +\pagebreak +\chapter{Tasking Constructs} +\label{chap:tasking} + +The following example shows how to traverse a tree-like structure using explicit +tasks. Note that the \code{traverse} function should be called from within a +parallel region for the different specified tasks to be executed in parallel. Also +note that the tasks will be executed in no specified order because there are no +synchronization directives. Thus, assuming that the traversal will be done in post +order, as in the sequential code, is wrong. + +\cexample{tasking}{1c} + +\fexample{tasking}{1f} + +In the next example, we force a postorder traversal of the tree by adding a \code{taskwait} +directive. Now, we can safely assume that the left and right sons have been executed +before we process the current node. + +\cexample{tasking}{2c} + +\fexample{tasking}{2f} + +The following example demonstrates how to use the \code{task} construct to process +elements of a linked list in parallel. The thread executing the \code{single} +region generates all of the explicit tasks, which are then executed by the threads +in the current team. The pointer \plc{p} is \code{firstprivate} by default +on the \code{task} construct so it is not necessary to specify it in a \code{firstprivate} +clause. + +\cexample{tasking}{3c} + +\fexample{tasking}{3f} + +The \code{fib()} function should be called from within a \code{parallel} region +for the different specified tasks to be executed in parallel. Also, only one thread +of the \code{parallel} region should call \code{fib()} unless multiple concurrent +Fibonacci computations are desired. + +\cexample{tasking}{4c} + +\fexample{tasking}{4f} + +Note: There are more efficient algorithms for computing Fibonacci numbers. This +classic recursion algorithm is for illustrative purposes. + +The following example demonstrates a way to generate a large number of tasks with +one thread and execute them with the threads in the team. While generating these +tasks, the implementation may reach its limit on unassigned tasks. If it does, +the implementation is allowed to cause the thread executing the task generating +loop to suspend its task at the task scheduling point in the \code{task} directive, +and start executing unassigned tasks. Once the number of unassigned tasks is sufficiently +low, the thread may resume execution of the task generating loop. + +\cexample{tasking}{5c} +\pagebreak +\fexample{tasking}{5f} + +The following example is the same as the previous one, except that the tasks are +generated in an untied task. While generating the tasks, the implementation may +reach its limit on unassigned tasks. If it does, the implementation is allowed +to cause the thread executing the task generating loop to suspend its task at the +task scheduling point in the \code{task} directive, and start executing unassigned +tasks. If that thread begins execution of a task that takes a long time to complete, +the other threads may complete all the other tasks before it is finished. + +In this case, since the loop is in an untied task, any other thread is eligible +to resume the task generating loop. In the previous examples, the other threads +would be forced to idle until the generating thread finishes its long task, since +the task generating loop was in a tied task. + +\cexample{tasking}{6c} + +\fexample{tasking}{6f} + +The following two examples demonstrate how the scheduling rules illustrated in +\$ affect the usage of \code{threadprivate} variables in tasks. A \code{threadprivate} +variable can be modified by another task that is executed by the same thread. Thus, +the value of a \code{threadprivate} variable cannot be assumed to be unchanged +across a task scheduling point. In untied tasks, task scheduling points may be +added in any place by the implementation. + +A task switch may occur at a task scheduling point. A single thread may execute +both of the task regions that modify \code{tp}. The parts of these task regions +in which \code{tp} is modified may be executed in any order so the resulting +value of \code{var} can be either 1 or 2. + +\cexample{tasking}{7c} + + +\fexample{tasking}{7f} + +In this example, scheduling constraints prohibit a thread in the team from executing +a new task that modifies \code{tp} while another such task region tied to the +same thread is suspended. Therefore, the value written will persist across the +task scheduling point. + +\cexample{tasking}{8c} + + +\fexample{tasking}{8f} + +The following two examples demonstrate how the scheduling rules illustrated in +\$ affect the usage of locks and critical sections in tasks. If a lock is held +across a task scheduling point, no attempt should be made to acquire the same lock +in any code that may be interleaved. Otherwise, a deadlock is possible. + +In the example below, suppose the thread executing task 1 defers task 2. When +it encounters the task scheduling point at task 3, it could suspend task 1 and +begin task 2 which will result in a deadlock when it tries to enter critical region +1. + +\cexample{tasking}{9c} + + +\fexample{tasking}{9f} + +In the following example, \code{lock} is held across a task scheduling point. + However, according to the scheduling restrictions, the executing thread can't +begin executing one of the non-descendant tasks that also acquires \code{lock} before +the task region is complete. Therefore, no deadlock is possible. + +\cexample{tasking}{10c} + + +\fexample{tasking}{10f} + +The following examples illustrate the use of the \code{mergeable} clause in the +\code{task} construct. In this first example, the \code{task} construct has +been annotated with the \code{mergeable} clause. The addition of this clause +allows the implementation to reuse the data environment (including the ICVs) of +the parent task for the task inside \code{foo} if the task is included or undeferred. +Thus, the result of the execution may differ depending on whether the task is merged +or not. Therefore the mergeable clause needs to be used with caution. In this example, +the use of the mergeable clause is safe. As \code{x} is a shared variable the +outcome does not depend on whether or not the task is merged (that is, the task +will always increment the same variable and will always compute the same value +for \code{x}). + +\cexample{tasking}{11c} + +\fexample{tasking}{11f} + +This second example shows an incorrect use of the \code{mergeable} clause. In +this example, the created task will access different instances of the variable +\code{x} if the task is not merged, as \code{x} is \code{firstprivate}, but +it will access the same variable \code{x} if the task is merged. As a result, +the behavior of the program is unspecified and it can print two different values +for \code{x} depending on the decisions taken by the implementation. + +\cexample{tasking}{12c} + +\fexample{tasking}{12f} + +The following example shows the use of the \code{final} clause and the \code{omp\_in\_final} +API call in a recursive binary search program. To reduce overhead, once a certain +depth of recursion is reached the program uses the \code{final} clause to create +only included tasks, which allow additional optimizations. + +The use of the \code{omp\_in\_final} API call allows programmers to optimize +their code by specifying which parts of the program are not necessary when a task +can create only included tasks (that is, the code is inside a \code{final} task). +In this example, the use of a different state variable is not necessary so once +the program reaches the part of the computation that is finalized and copying from +the parent state to the new state is eliminated. The allocation of \code{new\_state} +in the stack could also be avoided but it would make this example less clear. The +\code{final} clause is most effective when used in conjunction with the \code{mergeable} +clause since all tasks created in a \code{final} task region are included tasks +that can be merged if the \code{mergeable} clause is present. + +\cexample{tasking}{13c} + +\fexample{tasking}{13f} + +The following example illustrates the difference between the \code{if} and the +\code{final} clauses. The \code{if} clause has a local effect. In the first +nest of tasks, the one that has the \code{if} clause will be undeferred but +the task nested inside that task will not be affected by the \code{if} clause +and will be created as usual. Alternatively, the \code{final} clause affects +all \code{task} constructs in the \code{final} task region but not the \code{final} +task itself. In the second nest of tasks, the nested tasks will be created as included +tasks. Note also that the conditions for the \code{if} and \code{final} clauses +are usually the opposite. + +\cexample{tasking}{14c} + +\fexample{tasking}{14f} + +\section*{Task Dependences} + +\section{Flow Dependence} + +In this example we show a simple flow dependence expressed using the \code{depend} +clause on the \code{task} construct. + +\cexample{tasking}{15c} + +\fexample{tasking}{15f} + +The program will always print \texttt{"}x = 2\texttt{"}, because the \code{depend} +clauses enforce the ordering of the tasks. If the \code{depend} clauses had been +omitted, then the tasks could execute in any order and the program and the program +would have a race condition. + +\section{Anti-dependence} + +In this example we show an anti-dependence expressed using the \code{depend} +clause on the \code{task} construct. + +\cexample{tasking}{16c} + +\fexample{tasking}{16f} + +The program will always print \texttt{"}x = 1\texttt{"}, because the \code{depend} +clauses enforce the ordering of the tasks. If the \code{depend} clauses had been +omitted, then the tasks could execute in any order and the program would have a +race condition. + +\section{Output Dependence} + +In this example we show an output dependence expressed using the \code{depend} +clause on the \code{task} construct. + +\cexample{tasking}{17c} + +\fexample{tasking}{17f} + +The program will always print \texttt{"}x = 2\texttt{"}, because the \code{depend} +clauses enforce the ordering of the tasks. If the \code{depend} clauses had been +omitted, then the tasks could execute in any order and the program would have a +race condition. + +\section{Concurrent Execution with Dependences} + +In this example we show potentially concurrent execution of tasks using multiple +flow dependences expressed using the \code{depend} clause on the \code{task} +construct. + +\cexample{tasking}{18c} + +\fexample{tasking}{18f} + +The last two tasks are dependent on the first task. However there is no dependence +between the last two tasks, which may execute in any order (or concurrently if +more than one thread is available). Thus, the possible outputs are \texttt{"}x ++ 1 = 3. x + 2 = 4. \texttt{"} and \texttt{"}x + 2 = 4. x + 1 = 3. \texttt{"}. +If the \code{depend} clauses had been omitted, then all of the tasks could execute +in any order and the program would have a race condition. + +\section{Matrix multiplication} + +This example shows a task-based blocked matrix multiplication. Matrices are of +NxN elements, and the multiplication is implemented using blocks of BSxBS elements. + +\cexample{tasking}{19c} + +\fexample{tasking}{19f} + diff --git a/Examples_taskyield.tex b/Examples_taskyield.tex new file mode 100644 index 0000000..8cca5bf --- /dev/null +++ b/Examples_taskyield.tex @@ -0,0 +1,14 @@ +\pagebreak +\chapter{The \code{taskyield} Directive} +\label{chap:taskyield} + +The following example illustrates the use of the \code{taskyield} directive. +The tasks in the example compute something useful and then do some computation +that must be done in a critical region. By using \code{taskyield} when a task +cannot get access to the \code{critical} region the implementation can suspend +the current task and schedule some other task that can do something useful. + +\cexample{taskyield}{1c} + +\fexample{taskyield}{1f} + diff --git a/Examples_teams.tex b/Examples_teams.tex new file mode 100644 index 0000000..a680d09 --- /dev/null +++ b/Examples_teams.tex @@ -0,0 +1,118 @@ +\pagebreak +\chapter{\code{teams} Constructs} +\label{chap:teams} + +\section{\code{target} and \code{teams} Constructs with \code{omp\_get\_num\_teams}\\ +and \code{omp\_get\_team\_num} Routines} + +The following example shows how the \code{target} and \code{teams} constructs +are used to create a league of thread teams that execute a region. The \code{teams} +construct creates a league of at most two teams where the master thread of each +team executes the \code{teams} region. + +The \code{omp\_get\_num\_teams} routine returns the number of teams executing in a \code{teams} +region. The \code{omp\_get\_team\_num} routine returns the team number, which is an integer +between 0 and one less than the value returned by \code{omp\_get\_num\_teams}. The following +example manually distributes a loop across two teams. + +\cexample{teams}{1c} + +\fexample{teams}{1f} + +\section{\code{target}, \code{teams}, and \code{distribute} Constructs} + +The following example shows how the \code{target}, \code{teams}, and \code{distribute} +constructs are used to execute a loop nest in a \code{target} region. The \code{teams} +construct creates a league and the master thread of each team executes the \code{teams} +region. The \code{distribute} construct schedules the subsequent loop iterations +across the master threads of each team. + +The number of teams in the league is less than or equal to the variable \plc{num\_blocks}. +Each team in the league has a number of threads less than or equal to the variable +\plc{block\_threads}. The iterations in the outer loop are distributed among the master +threads of each team. + +When a team's master thread encounters the parallel loop construct before the inner +loop, the other threads in its team are activated. The team executes the \code{parallel} +region and then workshares the execution of the loop. + +Each master thread executing the \code{teams} region has a private copy of the +variable \plc{sum} that is created by the \code{reduction} clause on the \code{teams} construct. +The master thread and all threads in its team have a private copy of the variable +\plc{sum} that is created by the \code{reduction} clause on the parallel loop construct. +The second private \plc{sum} is reduced into the master thread's private copy of \plc{sum} +created by the \code{teams} construct. At the end of the \code{teams} region, +each master thread's private copy of \plc{sum} is reduced into the final \plc{sum} that is +implicitly mapped into the \code{target} region. + +\cexample{teams}{2c} + +\fexample{teams}{2f} + +\section{\code{target} \code{teams}, and Distribute Parallel Loop Constructs} + +The following example shows how the \code{target} \code{teams} and distribute +parallel loop constructs are used to execute a \code{target} region. The \code{target} +\code{teams} construct creates a league of teams where the master thread of each +team executes the \code{teams} region. + +The distribute parallel loop construct schedules the loop iterations across the +master threads of each team and then across the threads of each team. + +\cexample{teams}{3c} + +\fexample{teams}{3f} + +\section{\code{target} \code{teams} and Distribute Parallel Loop +Constructs with Scheduling Clauses} + +The following example shows how the \code{target} \code{teams} and distribute +parallel loop constructs are used to execute a \code{target} region. The \code{teams} +construct creates a league of at most eight teams where the master thread of each +team executes the \code{teams} region. The number of threads in each team is +less than or equal to 16. + +The \code{distribute} parallel loop construct schedules the subsequent loop iterations +across the master threads of each team and then across the threads of each team. + +The \code{dist\_schedule} clause on the distribute parallel loop construct indicates +that loop iterations are distributed to the master thread of each team in chunks +of 1024 iterations. + +The \code{schedule} clause indicates that the 1024 iterations distributed to +a master thread are then assigned to the threads in its associated team in chunks +of 64 iterations. + +\cexample{teams}{4c} + +\fexample{teams}{4f} + +\section{\code{target} \code{teams} and \code{distribute} \code{simd} Constructs} + +The following example shows how the \code{target} \code{teams} and \code{distribute} +\code{simd} constructs are used to execute a loop in a \code{target} region. +The \code{target} \code{teams} construct creates a league of teams where the +master thread of each team executes the \code{teams} region. + +The \code{distribute} \code{simd} construct schedules the loop iterations across +the master thread of each team and then uses SIMD parallelism to execute the iterations. + +\cexample{teams}{5c} + +\fexample{teams}{5f} + +\section{\code{target} \code{teams} and Distribute Parallel Loop SIMD Constructs} + +The following example shows how the \code{target} \code{teams} and the distribute +parallel loop SIMD constructs are used to execute a loop in a \code{target} \code{teams} +region. The \code{target} \code{teams} construct creates a league of teams +where the master thread of each team executes the \code{teams} region. + +The distribute parallel loop SIMD construct schedules the loop iterations across +the master thread of each team and then across the threads of each team where each +thread uses SIMD parallelism. + +\cexample{teams}{6c} + +\fexample{teams}{6f} + diff --git a/Examples_threadprivate.tex b/Examples_threadprivate.tex new file mode 100644 index 0000000..27e582a --- /dev/null +++ b/Examples_threadprivate.tex @@ -0,0 +1,106 @@ +\pagebreak +\chapter{The \code{threadprivate} Directive} +\label{chap:threadprivate} + +The following examples demonstrate how to use the \code{threadprivate} directive + to give each thread a separate counter. + +\cexample{threadprivate}{1c} + +\fexample{threadprivate}{1f} + +\ccppspecificstart +The following example uses \code{threadprivate} on a static variable: + +\cnexample{threadprivate}{2c} + +The following example demonstrates unspecified behavior for the initialization +of a \code{threadprivate} variable. A \code{threadprivate} variable is initialized +once at an unspecified point before its first reference. Because \code{a} is +constructed using the value of \code{x} (which is modified by the statement +\code{x++}), the value of \code{a.val} at the start of the \code{parallel} +region could be either 1 or 2. This problem is avoided for \code{b}, which uses +an auxiliary \code{const} variable and a copy-constructor. + +\cnexample{threadprivate}{3c} +\ccppspecificend + +The following examples show non-conforming uses and correct uses of the \code{threadprivate} +directive. + +\fortranspecificstart +The following example is non-conforming because the common block is not declared +local to the subroutine that refers to it: + +\fnexample{threadprivate}{2f} + +The following example is also non-conforming because the common block is not declared +local to the subroutine that refers to it: + +\fnexample{threadprivate}{3f} + +The following example is a correct rewrite of the previous example: +% blue line floater at top of this page for "Fortran, cont." +\begin{figure}[t!] +\linewitharrows{-1}{dashed}{Fortran (cont.)}{8em} +\end{figure} + +\fnexample{threadprivate}{4f} + +The following is an example of the use of \code{threadprivate} for local variables: + +\fnexample{threadprivate}{5f} +% blue line floater at top of this page for "Fortran, cont." +\begin{figure}[t!] +\linewitharrows{-1}{dashed}{Fortran (cont.)}{8em} +\end{figure} + +The above program, if executed by two threads, will print one of the following +two sets of output: + +\code{a = 11 12 13} +\\ +\code{ptr = 4} +\\ +\code{i = 15} + +\code{A is not allocated} +\\ +\code{ptr = 4} +\\ +\code{i = 5} + +or + +\code{A is not allocated} +\\ +\code{ptr = 4} +\\ +\code{i = 15} + +\code{a = 1 2 3} +\\ +\code{ptr = 4} +\\ +\code{i = 5} + +The following is an example of the use of \code{threadprivate} for module variables: + +\fnexample{threadprivate}{6f} +\fortranspecificend + +\ccppspecificstart +The following example illustrates initialization of \code{threadprivate} variables +for class-type \code{T}. \code{t1} is default constructed, \code{t2} is constructed +taking a constructor accepting one argument of integer type, \code{t3} is copy +constructed with argument \code{f()}: + +\cnexample{threadprivate}{4c} + +The following example illustrates the use of \code{threadprivate} for static +class members. The \code{threadprivate} directive for a static class member must +be placed inside the class definition. + +\cnexample{threadprivate}{5c} +\ccppspecificend + diff --git a/Examples_workshare.tex b/Examples_workshare.tex new file mode 100644 index 0000000..0870f3d --- /dev/null +++ b/Examples_workshare.tex @@ -0,0 +1,76 @@ +\pagebreak +\chapter{The \code{workshare} Construct} +\fortranspecificstart +\label{chap:workshare} + +The following are examples of the \code{workshare} construct. + +In the following example, \code{workshare} spreads work across the threads executing +the \code{parallel} region, and there is a barrier after the last statement. +Implementations must enforce Fortran execution rules inside of the \code{workshare} +block. + +\fnexample{workshare}{1f} + +In the following example, the barrier at the end of the first \code{workshare} +region is eliminated with a \code{nowait} clause. Threads doing \code{CC = +DD} immediately begin work on \code{EE = FF} when they are done with \code{CC += DD}. + +\fnexample{workshare}{2f} +% blue line floater at top of this page for "Fortran, cont." +\begin{figure}[t!] +\linewitharrows{-1}{dashed}{Fortran (cont.)}{8em} +\end{figure} + +The following example shows the use of an \code{atomic} directive inside a \code{workshare} +construct. The computation of \code{SUM(AA)} is workshared, but the update to +\code{R} is atomic. + +\fnexample{workshare}{3f} + +Fortran \code{WHERE} and \code{FORALL} statements are \emph{compound statements}, +made up of a \emph{control} part and a \emph{statement} part. When \code{workshare} +is applied to one of these compound statements, both the control and the statement +parts are workshared. The following example shows the use of a \code{WHERE} statement +in a \code{workshare} construct. + +Each task gets worked on in order by the threads: + +\code{AA = BB} then +\\ +\code{CC = DD} then +\\ +\code{EE .ne. 0} then +\\ +\code{FF = 1 / EE} then +\\ +\code{GG = HH} + +\fnexample{workshare}{4f} +% blue line floater at top of this page for "Fortran, cont." +\begin{figure}[t!] +\linewitharrows{-1}{dashed}{Fortran (cont.)}{8em} +\end{figure} + +In the following example, an assignment to a shared scalar variable is performed +by one thread in a \code{workshare} while all other threads in the team wait. + +\fnexample{workshare}{5f} + +The following example contains an assignment to a private scalar variable, which +is performed by one thread in a \code{workshare} while all other threads wait. +It is non-conforming because the private scalar variable is undefined after the +assignment statement. + +\fnexample{workshare}{6f} + +Fortran execution rules must be enforced inside a \code{workshare} construct. +In the following example, the same result is produced in the following program +fragment regardless of whether the code is executed sequentially or inside an OpenMP +program with multiple threads: + +\fnexample{workshare}{7f} +\fortranspecificend + + diff --git a/Examples_worksharing_critical.tex b/Examples_worksharing_critical.tex new file mode 100644 index 0000000..c3e785d --- /dev/null +++ b/Examples_worksharing_critical.tex @@ -0,0 +1,18 @@ +\pagebreak +\chapter{Worksharing Constructs Inside a \code{critical} Construct} +\label{chap:worksharing_critical} + +The following example demonstrates using a worksharing construct inside a \code{critical} +construct. This example is conforming because the worksharing \code{single} +region is not closely nested inside the \code{critical} region. A single thread +executes the one and only section in the \code{sections} region, and executes +the \code{critical} region. The same thread encounters the nested \code{parallel} +region, creates a new team of threads, and becomes the master of the new team. +One of the threads in the new team enters the \code{single} region and increments +\code{i} by \code{1}. At the end of this example \code{i} is equal to \code{2}. + +\cexample{worksharing_critical}{1c} + +\fexample{worksharing_critical}{1f} + + diff --git a/Introduction_Chapt.tex b/Introduction_Chapt.tex new file mode 100644 index 0000000..c84ef42 --- /dev/null +++ b/Introduction_Chapt.tex @@ -0,0 +1,69 @@ +% This is the introduction for the OpenMP Examples document. +% This is an included file. See the master file (openmp-examples.tex) for more information. +% +% When editing this file: +% +% 1. To change formatting, appearance, or style, please edit openmp.sty. +% +% 2. Custom commands and macros are defined in openmp.sty. +% +% 3. Be kind to other editors -- keep a consistent style by copying-and-pasting to +% create new content. +% +% 4. We use semantic markup, e.g. (see openmp.sty for a full list): +% \code{} % for bold monospace keywords, code, operators, etc. +% \plc{} % for italic placeholder names, grammar, etc. +% +% 5. Other recommendations: +% Use the convenience macros defined in openmp.sty for the minor headers +% such as Comments, Syntax, etc. +% +% To keep items together on the same page, prefer the use of +% \begin{samepage}.... Avoid \parbox for text blocks as it interrupts line numbering. +% When possible, avoid \filbreak, \pagebreak, \newpage, \clearpage unless that's +% what you mean. Use \needspace{} cautiously for troublesome paragraphs. +% +% Avoid absolute lengths and measures in this file; use relative units when possible. +% Vertical space can be relative to \baselineskip or ex units. Horizontal space +% can be relative to \linewidth or em units. +% +% Prefer \emph{} to italicize terminology, e.g.: +% This is a \emph{definition}, not a placeholder. +% This is a \plc{var-name}. +% + +\chapter*{Introduction} +\label{chap:introduction} +This collection of programming examples supplements the OpenMP API for Shared +Memory Parallelization specifications, and is not part of the formal specifications. It +assumes familiarity with the OpenMP specifications, and shares the typographical +conventions used in that document. + +\notestart +\noteheader – This first release of the OpenMP Examples reflects the OpenMP Version 4.0 +specifications. Additional examples are being developed and will be published in future +releases of this document. +\noteend + +The OpenMP API specification provides a model for parallel programming that is +portable across shared memory architectures from different vendors. Compilers from +numerous vendors support the OpenMP API. + +The directives, library routines, and environment variables demonstrated in this +document allow users to create and manage parallel programs while permitting +portability. The directives extend the C, C++ and Fortran base languages with single +program multiple data (SPMD) constructs, tasking constructs, device constructs, +worksharing constructs, and synchronization constructs, and they provide support for +sharing and privatizing data. The functionality to control the runtime environment is +provided by library routines and environment variables. Compilers that support the +OpenMP API often include a command line option to the compiler that activates and +allows interpretation of all OpenMP directives. + +Complete information about the OpenMP API and a list of the compilers that support +the OpenMP API can be found at the OpenMP.org web site + +\code{http://www.openmp.org} + + +% This is the end of introduction.tex of the OpenMP Examples document. + diff --git a/Makefile b/Makefile new file mode 100644 index 0000000..4ddb3af --- /dev/null +++ b/Makefile @@ -0,0 +1,88 @@ +# Makefile for the OpenMP Examples document in LaTex format. +# For more information, see the master document, openmp-examples.tex. + +version=4.0.1ltx +default: openmp-examples.pdf + + +CHAPTERS=Title_Page.tex \ + Introduction_Chapt.tex \ + Examples_Chapt.tex \ + Examples_ploop.tex \ + Examples_mem_model.tex \ + Examples_cond_comp.tex \ + Examples_icv.tex \ + Examples_parallel.tex \ + Examples_nthrs_nesting.tex \ + Examples_nthrs_dynamic.tex \ + Examples_affinity.tex \ + Examples_fort_do.tex \ + Examples_fort_loopvar.tex \ + Examples_nowait.tex \ + Examples_collapse.tex \ + Examples_psections.tex \ + Examples_fpriv_sections.tex \ + Examples_single.tex \ + Examples_tasking.tex \ + Examples_taskgroup.tex \ + Examples_taskyield.tex \ + Examples_workshare.tex \ + Examples_master.tex \ + Examples_critical.tex \ + Examples_worksharing_critical.tex \ + Examples_barrier_regions.tex \ + Examples_atomic.tex \ + Examples_atomic_restrict.tex \ + Examples_flush_nolist.tex \ + Examples_standalone.tex \ + Examples_ordered.tex \ + Examples_cancellation.tex \ + Examples_threadprivate.tex \ + Examples_pra_iterator.tex \ + Examples_fort_sp_common.tex \ + Examples_default_none.tex \ + Examples_fort_race.tex \ + Examples_private.tex \ + Examples_fort_sa_private.tex \ + Examples_carrays_fpriv.tex \ + Examples_lastprivate.tex \ + Examples_reduction.tex \ + Examples_copyin.tex \ + Examples_copyprivate.tex \ + Examples_nested_loop.tex \ + Examples_nesting_restrict.tex \ + Examples_set_dynamic_nthrs.tex \ + Examples_get_nthrs.tex \ + Examples_init_lock.tex \ + Examples_lock_owner.tex \ + Examples_simple_lock.tex \ + Examples_nestable_lock.tex \ + Examples_target.tex \ + Examples_target_data.tex \ + Examples_target_update.tex \ + Examples_declare_target.tex \ + Examples_teams.tex \ + Examples_async_target.tex \ + Examples_array_sections.tex \ + Examples_device.tex \ + Examples_associate.tex + +INTERMEDIATE_FILES=openmp-examples.pdf \ + openmp-examples.toc \ + openmp-examples.idx \ + openmp-examples.aux \ + openmp-examples.ilg \ + openmp-examples.ind \ + openmp-examples.out \ + openmp-examples.log + +openmp-examples.pdf: $(CHAPTERS) openmp.sty openmp-examples.tex openmp-logo.png + rm -f $(INTERMEDIATE_FILES) + pdflatex -interaction=batchmode -file-line-error openmp-examples.tex + pdflatex -interaction=batchmode -file-line-error openmp-examples.tex + pdflatex -interaction=batchmode -file-line-error openmp-examples.tex + cp openmp-examples.pdf openmp-examples-${version}.pdf + +clean: + rm -f $(INTERMEDIATE_FILES) + diff --git a/README b/README new file mode 100644 index 0000000..3948370 --- /dev/null +++ b/README @@ -0,0 +1,3 @@ +This is the OpenMP 4.0 specification in LaTex format. +Please see the master file, openmp-4.0.tex, for more information. + diff --git a/Title_Page.tex b/Title_Page.tex new file mode 100644 index 0000000..a4e557a --- /dev/null +++ b/Title_Page.tex @@ -0,0 +1,42 @@ +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Title page + + \begin{titlepage} + \begin{flushleft} + \hspace{-6em} \includegraphics[width=0.4\textwidth]{openmp-logo.png} + \end{flushleft} + + \begin{adjustwidth}{-0.75in}{0in} + \begin{center} + \Huge + \textsf{OpenMP\\Application Programming\\Interface} + + % An optional subtitle can go here: + \vspace{0.5in}\textsf{Examples}\vspace{-0.7in} + \normalsize + + \vspace{1.0in} + + \textbf{Version 4.0.1.ltx -- February, 2014} + \end{center} + \end{adjustwidth} + + \vspace{3.0in} + +\begin{adjustwidth}{0pt}{1em}\setlength{\parskip}{0.25\baselineskip}% +Copyright © 1997-2014 OpenMP Architecture Review Board.\\ +Permission to copy without fee all or part of this material is granted, +provided the OpenMP Architecture Review Board copyright notice and +the title of this document appear. Notice is given that copying is by +permission of OpenMP Architecture Review Board.\end{adjustwidth} + + \end{titlepage} + +% Blank page + +\clearpage +\thispagestyle{empty} +\phantom{a} +\emph{This page intentionally left blank} +\vfill + diff --git a/figs/proc_bind_fig.pdf b/figs/proc_bind_fig.pdf new file mode 100644 index 0000000000000000000000000000000000000000..7e77ecb75fcb4d43b6bc37c1656a1c1178be2641 GIT binary patch literal 22804 zcmbrlb9ALkw>=!&>Daby+fF*RZQFLo9d&Hmwr$%^I$!#n_uTv5aq;`(8_C|go~l(f zSJkSqcFmaziM+5V4FfF`6iNTV?ZH{m-OuU%K`3T?dVE_03n*@Gd^%}k8&fAUe3q{& zMSMC@b1Nrfhp$g7eJ5jKV?$dbV|-p-C`Ts;V|{BVH^2+co*3*V#EvJmYco*0vJn%u zl_himKL8GN9sE%IP(3R#`+A82Sp5B~JMqObgQxm>CaRv6;eZ+@mUF_$2lZGLqb|p- zHdmY8E_bNOw}p<+k&ls&xsKl-iLSn$4pm)!TVsiL4_kAE?+BytO4c94MgVr}aCFd0*5xjWb zIx`G-m09x7Cf)2_;&c1F&F8VLj zeJ4dGm@+&jw7vs?2m$KZO&#gEbnP~HfshViumk%Ah4y^V1V546!=nY3qd9kbr0M1E z=2V4;`>vkt^St7HcQw-C0N>TT#WSD$Ga`{3?gy6wH~)?7hD%|^oO6Sn(`bjAB|tq# zst=Y>45Ac$6onN*TQ}&o+D)zG_KS69DvNnO0f>1)gtVZYR^|v$b+U4_AHW@jH!P)q zE_VE=)qI|4MRg@*di$I4HS*#*PciD`TOb`&%R{vg&@w zRu=CZv_Di1!v<0NM#F$Fn$>t*(!U;j#G}PWkhz`V%FPIjLWvR%{EGJPV z1X`5Dcjb1wZ7;87iK^>cYD-~0T1)kSTCm;eR%|1P5lUom!GhTI;>x>`55MafyFk-pR8E#e3-GYsr^ z0WK9oYkvHd0G-zuC1GqL1r7Z8fdCfgy*`dx8YIeqD;)t7T`~S1-og`TMWW3|jNgUi zouvHw!$Vl|v{E5@rDiBRnj|3wGl(NP@ojlz7>@(bzwX6y+v)}a8x|P~The1&UUa({ zH#q3=7gBeUp<>#~te@eQ`P#*M?v&2}^t8@xM~0>9SXh9@B}RX!H65^avGlr{a3Z%w zo+pN|3N{AuxX*3z`T~w>*{=DmKcfKIApdt+pqd1c4{hb*=~A^mu~IeUM|MWECdT3F zDxHZUnBAJW(g?m0{Jt90#go=iKBq%YForY`pl_bDKkA+aVK?6nHEF-`54^F{D(Sqc zmNXdP^Djz=)5s<^fR=kWgqJW>!Cx+ zQp>JZSyeOanfZ(YdOBq`N*W$LB@oSOMIO6fE!Hu@!3$rvC}~!aPzkYs;Ha5jK|l9) zV@H~DTwDwJhrV!M`yiyLhO;sQK1^^jW5LLqD!@y?HFHG-AUOjb=_p zEc+UzP$(?4RdL&By(~pY?srP83DSVlTHQ9|%ihc(`Gn?ggCtWv6po>Nr4IeS=D|kV zCyKAfN!R45slY*Kt*-e9JD4OU%||X7i~Fk%xPglWS%;6_YiX7r#hUP^euyrzOc%=@ zBs6k6_CcNJLfBcEmhK`w3SHlErV==9RIuY>=`UzvsR~k{t%tc6y8lqie4iMDIjWa9 zCbm{>Lnfa`d?J(Q7v^EPN8VKrtJyCooCm+!#{2z^R&)i})c<)_;nHufh;I+zRE2@J z*>>}~&o}4yWNd2J?cAE$CEeu?yxNiS&}Af@>qZrccH~Rxo5$+{L+3%xZ}%)J#(DI) znSwlIQtjUZ3SFNko%&7AI&hb*ko`V*px#z!aLCKl&)2ILvu5*(2Uc+=R*udvtRveSD@^)DV14f^P8H=q8-6kHAtuFtBBv9)13`EDv$OCEP@ zxMRL;=J)LxHWc`^>_%6hP!A%r5od`%yzS#T?KE>knn9z*29PnFfz|^a6vIFqg8}4z zDw5zQSMtT>uj?J1WjKz}jiepmycFy_m0zFx1gi_;5jW1h2zCLDuZ>f!PmGd9-8Yn@ zc9!3}w!6CnKbUK1+vv_GJTNXHN~B#Djl253QsbR$dTi|y5c`jvzNCDsX}6>O!F*xQ z*KA92DfBvZkMv5cGK|$KLcm~1I01!$!@*WJi{}!j*;?0 zD;>0F7__YVh3%S+;tJ_R$seG*9LW+uvOFoa61HuTjjWZ|k^o_)AbO2Roj~?hAw^7+Vs_`o3#1h;90g z5FHd2_>mrmw5<}|REPvsHfqms^ zAZCojQLA+zo|=3*_AP85cJO++-s&Jck322)(_fk9PdMT=)Yu;PHgl2jK$>SVWcK%H z!lQMma*~e+NA9l14AN&hVA=9%?3LFbcq|Ie^E~YmDBzvyqXPr6*TKX^1@U#KbeV*h zmpd@)d>O{1I>Q)aC$un2o9VlB!x-*^s-^w0E@%bvU?Q#W_QU~Y%^QUYjB&R~6)_2V zdwB}1-!beo%Su#vzR@r0p(qhcrAS&SG-bOO_3SuB_e0DG0+-_{g34lstX)z^z|~b} z!O|8VZu`;{>vu|;NZs%PW$Fs7AwwMgbP$=M)Eby?)SW*N7bV8r6A5K4Z!oR}GH{%$ z@A4UBC`;HxU=%4_QS?EQ)1U{HKjwC%uXMcf3ow{RBrgtC`Kb#S@gZuH8L1?l79EhXa>=bwDwp2G$V>*vom3 z!qIN{a{Y)UDC27dM1RK118|j|Y)M`PfGHsT7irRBND;~<5liF#?^rqD7il+Nc1p8PNg*ePTiq5W3108|gLU}S>6(v4+tTi@5 zv$R&VkrmsWc5^Dm(ZB5#(A67dInHB8EsbvXwab*FgaaiUpMQG5Af3yQxIr~-QvFad z*&_wWz!42ih}q=FDUEzgUeC)I;cYqY59R*WRG&Qr9UJhL0u|eKEhrNJ7F^`jg-2&X z;yA;!Nw1-gAS|^`+;nykEU;KHis1DCOFr7nK_1M-ONr|Z87L3xNf@~8O_r%fqFfpK zEg&^tKJscH-S8XHD_Vi@5Dzv|OlU8RhQ)?B15WSz&VJ)McPS9LLNL zXLHbq_KCelW$arxJ5rtKd@Bg@LKUqaq{#><{IR1(kV>&M4ky+_1lWlUikiZ)K24pM zM+lU;3Q>?CsWhpmROEcZ!DUntx44pM0Fs5GrAloOv#N~Os{^3z%%DBlV(C$o(!KnB6+&|c)p6PAPN$KI*s%?>3~JX-(}miu*AUK#OfceQId<)_QUGsF zr{uqU*R~$+SxTCzv?vW8*ASoY9<#*2lR|haWFS+?dBf17%7tLWobZ|c z=Aeqkj<(JYhQ^NgtbbPs+1faLwL9Yf;jLdJRmRxJTwl=E4PTS~tAdH15ubs9RU7Jy zr~V7)PrrZot-OP+p^~u^zUCL0uqZyAvay>JzBWFckgb)igOZ)Tp)vj+8Z6|MnUw$Hhrso9QGw`B5ObT0cm(P4m6LjXRVj(g6;h z$miysGo=COzoqGpACcx-g)@qL!?+B;1pgQ;8fQx+LFv|vT`(?Tx0TM1@@C$M2 zhxx(ru*vI9ozjZ|165L=%ubk_^wfPlObk7mUzKf&2q1}ub(&fHMFsZ7g~sBc*-O{T z7Os!d2hXs_o5~I8`Bb(*RJO*J)p4tNtEAjnS~ z0XPMiRvgHjAEZ`*cNqXmfMFTXCD6hSVBX(j8bmgL)ecMxM6Dav4jRT!j2|kbM~WVB z)88B-;2HrXPoOjowE#X%a1jCPJA}KCfIRy*-~plVID`cLmub>sbjrZeTp@X$dm<;y zRtW9D*Pr0i_{?A*fZjofKY-@+VV40K{Z^{Eupz{H$F_ytP%^>My4Q9jn^Ae;ntIW8 zu&x29gLQioA^3+OfM-P2A+T@9-0TBr-;|U9ZN<`A*;0mx>qQ&Fw_kqDebM=3q zqYh&1g=$3Y7^vzm8c5PF{4o5XDvfr?YJ$Mz{}NDWuu$_$ovfVC1(FppBbugPRWDXg zvpTf~cv=6P3ma~z8)FyS&Zik&i_wOq5~K-!DXPuytPggF^v127a`W3&0DO<*wSgBw zCzLO?FYZ<>-e4D59OQQp%K&(S6ntVUVr2wOh$D!PAjDo~1^;3>C&CZ}_kJw{ikg^Z zfp!UOQrX0B5+THBio_IY_5R8d7KGZQJfs~2i6fjwVh-pU{5o=##5wr7B=8A*@=4^R z-{d5*MFdx5IV4;7-TB>x3Ke0CZRXWWf3#+Om+KJrmh`3*OJqvDOWhl(NGyxDOg>BX zB#}#6N_9=urOhGJCGeH}{p-CMNTG+nN6A0GS~XX6r@ogbSVAN{FWDf>Al)F`AaIvu zK!Kz^!9Sr1Nv?$dq~s$knacIj~aC7lhZE8l}$+MA~|v^ zDldv?W_SxW%6KXai|f=)^JVKMk+l=(a3cAF) zG<`?Ar}0K57o_q6QfLf#hSy?}Ujywf~+6SW6U=1EpFCsDMOr7=k{2|Jk& z4TE-#Hcx}@Fk`>djO`FlYeXBR>t>fbud=)>i8<8JBt z=ymB$4ul<~9P${d07Mi-6`U8E5fTa18KkcVu%|5mk8W0%SZf{?Nbp_AC72tM1x6d? z)e)VRnz@|x+`U=F&Bx6ZgvLNbSg5~EJa%|?SS&IcRSMNrbVO`GWI;?u#8V_yL@HIC zTBB}XH0pa4{x2R>JS-GXVi$*!r`Zju(7p3rsJ%;CCasjZ^Hqn2gOahS$~fH~4SPyl zEIgbogwJr~-jW09%6r`w*8`BH#J144grh;Kqv#v$XXE#Hkkp{spc&!Re(i8WiAo6+ zi9H}Wfrf48THRa!{gR}(q7bd^gtHp3Lb1BoFsZAsSW6|;nRzf6+l|d)XL& z47%tjd@Ou(-FAU+UEerqy;Dy!(9l_#uH4qHI2gapyKQPyJMUE0*Rl6IQ4A0$XXp*Tk6`f_MHQa1|9(C#r=le?mPS>Z&@K=J)pn7 zQ{FdqmUr6PW$LTzD|{h-6F(&uELJ$w8|%ElHNV7G%$CI38=Wv%vu8hK`?38XkDB{|>#?ZR zxxL^nir}=O%y! zGw@t_?5>wk3Z*QS5cfRphbJJt09Dy(b1@)O>eqUB9pl*IIO00eSrg{bHE&4APzg&Z ztIV1rPEIUBP0E&un5~i*(mj`3;gZbya{am4*PnJ6$GdZDAhX?$!%tcj7OG$4>D$&@(iT{ zq8*I8ec6PrNnaNjeK>JP#RjXD&?LUDB0=9_YKJb?zKP)zo;Jhz{#-jy{VlVw#jqJZ ze3R-?xig$^so@^`TB=&NszpNI7xX#yb=C{W4Nu{|B*EKh^GHlrx8mC-*e0mwj9n45 z%$tQXgC{n6&CCPI*^gl&_9bUiq`Cq$zbn<}`eno8_~KzD^KJd@9!c-gG~IN2)x)5T zvAXYR<3L2QMqNb{`+neleDxLW#h??joNP>asJBvTmNu0o0;`qj8Vb-KjA>jtvBMPB zZOOe!cw=y_F1Z+EsFH&-C#1d=CLX4UtIMEm*=VbAIUBR*PGIQn%Y5yebcbNrYufXQ z295dMV#mV5M6#$f1`8#UTm|ykj7j|+qO9B`jKe{}ePj9zgmSY;RvYddv3o;7QMG6t zGd`c^T?|24v=k!>n$OYAG%NgeoQazkKaG+2Q)|@DmbKc|+ckOb{ z%BY;O^0)8&-sE8llPg!4uM@GqL(;3IsP2j6rWu$uFOc!UkD{@c(efLNMO%w zw>73$6<2HW3r}DCr-?{=_=b7MXIplrOMmD6F0m=rEk>K);<5`%F%Y!kwdcVS*5Fwyb+;owqTjVLZ&1;>bZ}0ko4aEUdxSD z{jEh8H?e5HsE66Hrrj`?Jn7Y4tDQhu?|F^qidA*3{A@!%Vwb zoc5|B_fSq5(-Yc0U|Vo`5@jxntfMGuD^;ac6p&t{&5YU$VxcG#%qUX_WWro{Y?z;wY?xfSgrBH0#&>)g0QPSGL)!Y2Y5t@r z26|?;e^Syvb^j%8{jHPyN80-DwEd6F;`qM_Cx5gM=P!+d0iRCF+{p1uDfwH-(EfLJ z|4+L7qm}$EQ3&Zf>08;F{;lCS{v+O~8ap_e+uGpMG0-yqTmL_*$A484{*p!Ll$;Hm z{t|+ezodu1$NiIv|87*%P!ds5qY`j1*SC^U{#!{AHg+_0Ft>BEb%0{{OG^1tXl%Z& zDVW=Qc_O24sAy}gZ}XouqUH{cPC{n-4){!rUw0k!|MkGY_%&HIb0a6SzoyH^4)sUV z`QLsR+1T+}SXlqh*MIc=KS%lxtN#`2KP|oxzs6#r|9brk`%l}SG9%-k0R3tCyY%lC zOiWCFw|x2h$DZvUTd4mM&i^?c|GBt-FSe|{^_N=n-@;&}Z~7JQul4*BCc(diI2u+~ z7JM2eMizWV`Y*p2=;^-%IXa229b#@MU}I`!{N)OrfTQ6bnU8~><&OmP_X7>%muyBS zq;Dr~Y;J1igwOW%olB?WWNfX9&+%m@ZLI$%v`}BOqEr8u3CmaD|1uHBXJ`Hz)y4F$ zNa8aye+5-W-|g?Gzx?>i!>>Cn#*ANneYv3cZ(H)OihuUxzrNhRw#8o(-rtX3QXe}5 zBm37p{~xzv3ccL*lowW>IF2@3TpwHNj8evlnMQ~c;~+r<1tEkT{6VINW$6RMiK%P9 zrvOCc^@H|=Nm@79&{$MNR2bL#0a{5UTZmB9E52E%m_;V9ikj(0K$G5mOs4rQH*LLr z+)V6q9C3_wJZ0WdAGv2clASG9>PnXvM2idSx(SV05b~z63~zpK*4HN1ZhV1MIMnL$ z7=b;h^&}bH`d;g>_i*B12Ss3SeX^S(a>Dom^-^3|ES_qPaob+VR^CRT4c8v)buy{~ z4ZaqLIht={)?$AB64WHtx!};Z>+~rhp`+7L>b#-X0_fg%+7Jo;rj$g(XG`h`DI~y@-ytH z%gd{WMfdVjHxDr%MI`Zf3d=5w(?$<7tvH^})z_T~Z0gGCh0GBzjR?hM;C;uCPD*H4 z0w6KOX|S&MtpJFk%+X5yDn3uUGD>miIad*6DK(5azzIc8H4cVlfla;vkwhpcYoQ7fwQKCSU;o5+o4~pfvb6I5)sD zq`WYnP90P=h8=<(>Q4miTW4N&B*Q1?O{&_;11c$z8WL?QE2M!+OQaL8({U#qN8{GD zA5Kk(#wVxx$g}PO_MENKZ&lUwqID~ML5pjN^#?B+yHX zXGql4bjqEM1SCk64UkA8#n~6AW@Iz!oZ8b0moat;^&ctDq?)QbY1`_Yj-JbwbB1lY z1^oJd2VLQ<;EkBLBvf(CT6D{H3v?@VWBB#T?s@`k!LNk&_weGA_*ry&{ndowH_FRj zTJyx=8rO1lli1gEq1F!m%~6dQ*T>=A&Lxu=5Qc~&h76Ak zu^Wb;Nsome@DZ-sRUAtXd|QGa34m6p6p-+oew(J7%ZQyHd>jCMrAC(fS18U!lng}d zQ>|{@QaC)7Ptb?tzHQBt@Nd$$!r?9c?C8h7^M=WDdJJ0ut{xUl2UvH=RoHVhZTCt$ zi}pmEeyEW66o68|IlwzWcz|y%aR)B6P;GXJ!29$@?Bkpxx+1@+-B-o$5A=Ch5n<4G zB&^0!y5r8H&Z8K39wHUlXqoZ7_v1%mQ43cg7DL2H8T!=ms=!|#=hqxjmstsaKZU{tn z8b9hUj8|DB8+l~bQ0E%g%+@aID2avfU|)N|IrRz@ zhyhY4%+63GWL#noAG+J9DLA)sTS=dk-Y6}XHD9a5?Wi~a;Ro_p1w`u%$mk4QV2hW1 ztyG5}lixRffh(=?J-~R*xIYVc2bck93J`%li2)NFuOj|};2P~f>S((>vGvyPNH^+i~_a7735&d^`48?(n0S@RE1# z%nllSWMxzSPR-=CHTN1;Ckr!2J0US9Y7thYrHF)Ukm2g=hrRwbM^ zTBYO@<Fk1x?F`Cx>i{xH8@HR`G_a-YFkKu zKMZ}cU_K4iCBQFD*ob$=C5xvx5GN-WOZk|(6nqWvLB^x0Sr_{|&@?>6dzSrmYE`3M z2U9IkeEwm&B@Zur+V>|OI~c|*Mh(NA53#|x?2{+;1|8l~zAo<6^pp|dOP+4$2=VJk z($ksQL|MhjuuuSRCxkhQ_jm93u{Z2Vu^cbr<2`GlP?4OzP1a2^4%v0mZ-S{-#K(e6 z65>vfGtx66QSCxb6d30YQ-!ooVPp~~Ghw{kJ=RuabdNPz!Z~B8x4vR%a$!T}OUwPe zgR28GtA}P62KURObQtq3z>}g@Nl@hd3i^80P5ofsRj&X1$}Eyanj-e>F=28>83`H?9uM8onlJ?FW(0DCL+V&Ru=lhZI=(l7 zKJ|Tf&sN_JFJR#$FbB5l#O3rkcH0C=+m&%q<^s!jZ;GCPyeyi6XEiT&5haUzZhfdY z3-5B#ka?{_!Bei#oRWx_-D|((^O-JWEoqv!TWh7&U~Z$;;BnLu3N6iRY$5e;Wk5Tl zPFc-XwrzDlryRPDNpLD5sw&%cCY{q8`W%5akS-oPJrB&a{~39@;)G)^BR+E8$^lcV zH_1&cwAUW;QC;{6WT4&8ltyafu_IlDqv+tvj}^bXK9()uSrKc zGO#xAVh}D|zR=39oT1ML3BU+D74L^lbnUB%2P}K%rKfSqY(Vy)4;yrX;DT&c=H&%(#Sl)JybktZ4$TWx1+uHDsKD1Igi>jE{_Gq5tnS@X{I^u<}_1#qboB z{iA(nhbYk#x@F411$m2UShk`VWOxjLQ-;+ey93>0({olYHmRzSL`CEc&&ei?Y z{aEJ2l<5;ETC85x8a#2!a6~z5|0}{;n6nRv%ijdcW^{G6`Lpl`cw=Zu<^G8jT;xbZ zv58lSy7E{in7I}AaIbJ5Oc}$6bwevT1y`eO`&*?nKOUU-!5r{j7+#`UkIgs}b)-^f zWt^x!SiO^QbBB)2S+ghfsg^O!OX@{m)3^b*RvgN_igs-JIz~_YL;Qt+yD*-qRnl8C z#zFYjV`lh-ef-ich{Q(Pp0n|N^S~@}UA%~xLl@^XuREeQ#d3a4&1u(T$#IB&3V%k> zoao*I^~sKXLk+s=lle)m2@QSMb`I(CZOicd>KuB6>_F1KM5{CbX_hj|qO2Zxi)R+^ zK>DRPvzId!6PNXzncMccW(TEDW1w`?pXYZ)mCv&7{O1k;#xm>mHUAO6>uD@8FmwMU zAX+(8zHN^y$MFX}yA7Lr#`hYRwED1^d^JPk!?^<|*bYc4cQo&)-{MgpMfb+#vsWh= zQ7eOj2IGC|92woe_B?Sk#}~WNJ>#6~T$fW5C^d*flL%10G&WN6ntIt)avo}u!lnZF z0zQeO!m4YT5fcvTqfrJ9TDg>?v9klbVZ1RsEKFEiOkTzDQP|N9$=F+Xb(Xz(j8o|b z32*+5GF&#+KrUSp&ta+UZYewu#a8Xo$y#w8N$CqZgxi=45}Rl{+V_wq%z& z?mn4Ob=DMFBGUu(#aEWb#4J<8!jk%!Nz$>EuzOgP*mt06$`_ScvaYC>4@}oiiJIB9 zWsCtyPJJSkUeVV=W~~@0+k~eAWaZ=>Lf^QFd9k-;$5|M=o~eEN5U>Oy9swW9irl6I zp7IogJJ3Cs>l@}*p!;6z?~;6}iu8d+{*jage2H8mP>;F=@DAv^zLXTY7%$FM%Qs|W{LMd96~yz78CPp)4a$(K=S!U zeJEv;r!Y-s3gi4VM>dRPPF-qertv>hXbF(Aq;3xqr)@F{6gj|OOw5u+kLx?)EvjXfa`|a=j--o z=8rIB#HP+ZD~hr&OLR{q8pKgbFu!A$M2jYfS>(mza@v{zU%y%8g^Sn9Z7YFx3T?A) zb8s}{E1v0oN0yj96t{Mm4Jo{6m|zi#G!Gr%X5h51aW`W)q1W{L?nmN1vw$;7RV?AxanSMXJjEQH$`09_jw6u~dsVw5OhWJMg*qKZt zXZm!r5=dt^@wf75Z9pERXOpq%UAT#~uS=h8h6pvQv|^}+GjrBJ$QvB0Y-h8hioAoz z$<-i<@xh2u1q2Zs(T5|uGX>r|W(WW|AOk8RB0q;~3(O51+gL-E3?rD$hnMo=AAJ$+ z`0KB(w#v;h$`x)Kd=WQ?U-ps8NX*AXxG`eMA|u!%i;)GCqU)K3DfyoPo%p`T@9o}d2G(Q)Evwn zOeoknusxYdh|Z$7-5*W2U#=D!Cd|KeG1JL5EltEM_AtlHH?qMySZ`$7Ce2=W3Dnq_ zVf80mhQlhx<;ECNlZP+X2Yb~(j~{?pDozgN5dQE`h_wJwi@?N8OPWtFDwqr6ATyOW z`K^ogP%wF0Cj9td95^Q)6All@%yYiKY@5`@z-`&4%mz*w+EZ(5%jTO8Tb_b@kQ|7? zjvM16Yh;ixFT{9v1DR)XcaJwGfpwk= zDoS2E!VIiJ>SYk8Bm4Rq% z_D_O-39Y>SkO@Hhkf~i{W4>9xZbo@7l*fhqYIoe!Gnn8AO^si_7oU;mHVy|;prk?@ zwp=1RW*8=KppS$qf#eJaS+znd(zuwwu!r?TiHFkm#>E1P(O)PDAAAb2hCz|yJzu`} zgc>D>G|f0Z@)8#Ep5H6iX3vLu^eesagfp5K)nkRCV?hicP}oo-);XnD&(()st^$8| z**K52R9S7|t%y}tQ&F>Kfr(_>D8<2K$YdSZ!*C)lY;%EO27&SYL~_+D;C-k$XTCT1 ztx?|z%*|OOz-DSP1}4`yame&gAnVG7U7k(k(QN{JNUW+O)UHaUNL58da-ABB&mma) zR{ACi1Mfoqc_({hM;5$wLbt)1!Oyz@j0#OpHsc06Q?8nQ+bY%c{+hiZN&GYTrxQMJ zN{(UQ9gr3PxL^#lkulYp$;zQypACHpDqoqiZkD}@o`GFV8$&(=Jyo-yw!X%(PFfA& zH1_(ijWVmcjf<5Et^(fT=5^Q5rov{;dr!Q(`ECU%57~Ftb>VOcCWg6~>bhk9nPZoE zQN2cnTB5fH&zkw8j9qW>#r~RggVTC*SnTbYcOk&=AWg?;OpVirRz~Ju!j8}eHWOU6 zPDx6UB91DBJ_BoVHpg0Q`Y&s8I9tyb-fgVbs|{z3GHNU}O(oJ*&m-@Z{_~!|z`#|V z&%;vpZ@^nzj;J~Zw{oc)6Yd8f5N?3=Oo{%mJ2&zb+P;<0{D>!Y{vpz(NMBf(q1(diW)t5z2sgGgg3Y9Fj9>X@&2A zVfvFz!T^r>d>3g#@byY}fr|8Z#)$g)Q=X-vD?(ZAjk2UJp^m^j;z&3vA}=KtQ-vWx z`xy80G4tx9#3;*atXXC!N0yg6XQ~3Kz1+ZN<^DlHhmnINW9vfo)S9QnaYMG~D{?aF zVAN}d!-v$TdpNaq?v^gYF)3E`Ug{7sB?Q=v+7WQOt8b1E7R?+|jaaS6P<%NE(V z0V_Dz-++JfmyHed13M@7K~jHYCbkY7m^`fD>I_|Ngljq~)TpcT#C4q+pnT5FHAh_^ z-4um~p5zZ=4pM@{fF}c=o(-}Io+d8_ImdVhJI8;REKOW`YSFdvj=qz-vCer+-zH>$ z+K0s#8e5J|A+jp;yo>IW%2P3|m1CeB*pbg6Lm6WVrA?y_j>j2|EqW|7Y0qVS6T|+^ z;{_&69U913*0S)#s+w`f$HY zI$GFO+FI3hk~B9!5ouKBt-cPY5(somE$k=NZ8j^Mu}F&ag27P(CGRy~e9KtfnTHy+ z>kz*KNVYAf+EuF8`Hsiya`+-<+p-7QI`#2lyUELU(4v-YGwyRUaH9h4Y0Gs#^FY;k zC*1aS+?Lb6eBC=XWo3y0D4Uk?8hH*{)NgJOXP4rqd!%&^k2tEqVk6=Y7oKhnS4OmE zg_{tMlTa5L1S4dnkgUmwNoutvQxGOZ~5~f||X>Mj&+{1ZnX|=RDl$Tw+&n@RC;gZJDu8eud z0z9LEL;6qC^h^YmVtR2Z?L<2@x0XqyASEi=Tr~6H@M4en1Tz~e8`tMtlnhrs@3Y}D z9$G2Osg1Ez>nEopuiLo{xTH2*48PS9H3YB1Iif4w4+KX)EA!UVS)?3LWXl|M6 zC=x6`Xc8pL5gz*z&f|$SY7tEuMoOIkz`I1PdgM+`2*-{E;W7?zT|T710yUg-N~}2!PT{~C4a!R=lth1kVaW=<6f}bkmvm%8S;cmQ z+MrQ=Jh`RFK#ka=Q>WU|n8jj8n{b7$*st zG5pikK<8)HlFk_}dC{FO@x{k!DIP30Xs%DOFDQEK)dxq2X|CbXFB0%0;~zQEbU?5x z6Dt@P1ZYc{sG-!Rp;j)E%6yN|`iKz1;uu>`ElJlO@Y3_X5D7h?hGA02I-%lcjBF+i zrab39lOLrIIA?ePqKRv^bfZbqeXxBrZ@ELn;-QDErp@b@eJ-IxmygRhtYKl7hrlxz za;s?@m(xtg+dp+2hVQLud8aKrg5ak(bTtdD7jdVJU6bWv*|MN+^Kw9Y5Sm)={j5Mm~X!9bnH4U zvi|zciqgei@@|OIf4fdU0(dt;_G0L@|kPWlupu7MixQn=IGmJEN^6Zk0j`TDYBnJwln-Ka$vx zSa3y5XiXT;Np5IfWL#+;teq!%(@Q3MG_l?L9U@H(Yly7Al9sdpY-n#tQHCxc1n&h5)xI?E10$ zqSpEP^CVb!3LbZ*0}FZ@$opuZBq6$d@gmepc@U3jl=PU9HnZ}jF_R5cy0id zrbarnX5pTV5vM+9s=&gi?AQc77Lc5YZ8{|X0Co!L$V!v+(F5qFC!D#Q_cSK$xy+0r){nZL( z#|Yf9ck@uJigm1N(;|Qx$MXmp^YSFuilZX7f82&0ayHP)ozBkh{>Wk^!-6vzfZHrxgXOAFYvYcQS&JE4d+|ol)03W{A&sxRk(3 zytrS-+PAxNF1r@XWz}_UYMG?%+Votj#y%2#n1d%!Gub7#XTqu zjdJ|Z(SsBZyo826HH3I94z(hfTq{M~M;6zL-<~N(uaDn4dz=O)Ne+?)rr z>3ZlO96a|O1qN`lyK>J2&_fn)>gssx=_q9%M>&R)x?Gt`y2i0ZEvTQ$hZlEXR7N$M@&PJJwV)SLNi?c+ zJSemWVF{m${xn063C5@Nbq~+G-+6#Sz0Mq1u%5Z%L=$*scP*nDS|3^vL$I}3me}&P zg?(UjteIlC>%drR{U`1a!zC#}bJotyYaRoAeimTxhQF-hLZ0`SYZrHmv*b&}Q_6IF z!y2pYxa4b>^Le&4-T1V0=X$D8CupcDOUh=o)yZ5bMwL&cR$EqRP>vheV$gKH4jj3F+FcwQ(b6M((;2ZfnQ{!_@6K9F2Y?Or#7n&qVI#wSC{!IvxnG zgYQ1a-kaujetF`K@-i0O5K~#ZN}6+8Ssz#LDSe75)*(*csI_zXBI}5w@iFF|)*8~9 z*yzwE-3dpVC=+p;h+`c7bC1M027>RW_<4=2Sm!SsN5zQ}u8b^eS&pbelL!5sXm)L_ zHue@fDBrabJ2;2lQnZFoVYTw+xk)wb4qg;VfZ?N85LuifPPI*ehhh&wnG!~_87CFR zI?ypl301_Z9TAh_lcOpv>81gw*oEJ-M^^d~M(cQ)-CZrx@%fnE^^s_Q#OIW6UFRR!ww#o- z`Bs1Q!n-P#cpti%d^#XGb~rzyRdqZq63EtZo@1}X)xk_#HC{p|%7c}qro+hm@)$EP z57tjMuNnB!^HA`E6~P;Is8*1h#;(KidDf9v33mq*866SxDm|Tpmw7H2LaungS;$1{ znDqZERh=3ry2MCHvCp4w^E<&V; zbVBcf6zSEQ?K$V(Bx z<>OeUl7Vax_$@HnTKZio&^tT{pw3Z3Zb+997lBPcWK)q}Jhhm@zu$;2BSoWdZ5WLr zi|R`PR)RZuyjFVpe9Pk3qF}0>vx&y9i`VE=dZ!4E7r-sl>)UH1%mMj9HfQ@rT@ zpu6BGJ2Rg>^SKLCb`ch_5kbWQkw%}5>ymOmZ=B{R>G0Z`iss0tG0aqt&*Y>4WO9}; zDmJ(V?-iV1i6LJ2&;DeYj@YD-|D zWOmw(lAAW@W)1)3*%X5#u!dCp)5C9! z9}$3k*-uNi4hmxWgb0NZ3dei0*Z1r#m*ek(k^Em)=`27WvqKH&b`f9!EAXAI;h^49 z)pUcv&Za5@_p`SYWbO>1k$T$d)i0U68Z8a>zekCvxF{(naKzBW&#BMDhhY~m?pk;= z!$6@d+SvBAKlGxiEZ{PV;aHF1==kS;d%oT4_3XjdQ~sE(bGPr(f04?6&Ui;E zp7tPaeLO>Hk3kjs9VqGWAk$xsTh&gD4-~G3R&&XJ6{^Rr#+wX}@#UU{$c$(vy5>Z( z@_jJU+NV^Q<(1~;UNJk(Ejj43vr$@(45Z*PBBJbSxW-@tH7Y?luWF=92F?t9bm0%7 zAbGFUZ_toY{#K&@WCvXfK=-JPe3NRQ#U{*Cw0NswO{Ku{9mUR@+uLbBy${yIDd64< zlB&o-qcdiYnhJpACjn-aRIovYT@rK6Pth!cJISe)$c}!&mPehv8k~>cLGaQfOQT_) z&7L_K^(m3!1)oWRb1-_EFU;&36C1CeD=5Yl4(-Ura$tyzihycql&5`~9-*g74$Y^M z8-r12C2~0rRQsX&d^u{PH5)ZyS(=O^VH^5>ISX1}o%-BXd{T7!%tr@Pgkl&3D<_}T z5z6y?wg$g@3})Qd>&_{Tx`R0-swBQfE=TOX+Wi@tc4AB9FtSwD@e?=3pq)<{)BjGn4X zx1Q{X(UmwThq9ZjcAF7^+hT!FF+P*H`6c`Mn{Om(hkNt07Ks z^VyfVa-SBnj~T<*eysZ$blcM??(p$ztaU2q?qe@JJtbKkM=eN}M$xoHequ?LM7++1 zF80E?6uw`x(lb)@tuNHs?8;w*J~TOVzikE*POcaW2)vT>urbXa9j*cl-;XhYz%@v| z5G380W=@c0;QG4k*2kk#4PX~w&o_biy$r7V*iboL@e^}Du%NtM-Tc|BStUHr?pX?& zR!@(ec#qW3=tulLc<I^*TZi~>}rN@h}hS7oC5M`mBWtaNem9_=1UBz*_s=~g<75KqGZzZl^#Efh0)~7 zngw&sorFy9M~)7}_n634gxSdeNk$?mvm>7-$uL;-DpoyTud_+lwQ5(gcE^8~&1-sb zU~%pyHh19FJ-()j6+vDwWRXlRR>n1t2B`}Mp@qJj_itg zQBdpJ>j7*#=^2i;GgxO=VGNCIM?d`n+66s-&M)-@bke`2;}{SFNz zEF@9Y9AXmGWs|7y&}glxk)=kGQmRaY4+;c~)~V58(| z!iGnsN+NCygZ~Qd4HdAl|Iq0=!bEZghZ_tV%v~MNrwP@B&3s@dB z&7rK9Uh+Zv?og@T?9aGoz}N zjVGAm@@7|T7^zkHzBT53!I&z;zDfJ?x7F&)o>M;EPMxhbJ_=;unSgs4w@=IlpN`rr z7TaBqQawg(_XUhyE-f0|LG>axjw#FegL>>pKKOsE(sn$8GBT;ft|~puss2)ft;1Gf zo3J0S4cIZ3O+m!Xt{-GSUc~gF?9>eb-2l3>=rW8G<~;6{bTc%3jz7r$M0nM7j1?de zY94q6URB)P%+eI9r%zm0ytBi>aki^><0*{e454tapaKZyZc8{-d^SjK}U#Q2<ASW9DhRmk0V%B$;Y?Vb?m;thN^{%nLr1z~w z8scvMXYzH|U?bkvrZ94cwrur!V~R*0Vmz848@7&eG7>8;wu?7^;hDd3G@}ump)Hos zR|vUOR1r-$*d)PQ*!*ibx!L4L6u3LbeLhtLd6f3y+i;Dxe&1!i1jk6{JU>z50pC(d zJZIov%=fdslz%YGjj&kyQW2Cg%;mR?fD|5kU$q@Lyx=_UQqH6U}-%!zlVXqWiIRBb)v+XgTJ(7wte#9$PH+d$_r%oO|G-mwG;8+x0eI z)mBdD{JwwLSW>2c8gNu9japMReuQ)}-abqt*bzHvuE&@)9~~8p6x#@ zZ+bel92>rHlJY3+#7<}pfu5>#Yh+OJ=uE^9UKsyB)vez70*b4vO1e7k+j z^we%iNYz4Nnz4&5A5FP!l=$a~J9nbxF5G4dqf0HUEB*a7t39YNsIT?kE|4XQrK4Y z8I1;%+-un^E0YYs?saSxcsniur27G`1>gEY&TEc??HoaI3Jb^umv_ir3@tLtYY#in zo%6twXyba7Nz%~sVC0qB+gyv4Ux zJ#hYnkM#Wwaj-Ou?zRP^Z0=@>E7@9#!`qUo*1Xo61N_N!=-yHSwQI<0(gE7{?nck7 z4@W-wQOIsJltdW7Z!Q4-_}wPggvE;4sXXy6e}mYlpn0o6WoMtvSGGnRDao8_>E+0V z`zJkIdmblC56fRI&Q%e~GLF#rf`E#8ly@s9?cW>sXMQD()gQNMK%rwUls zD{zb{R7dj1k;JyYnUY-#M9o-LPR5exee74F7VL2=1L+e4%?AOC8?19W9jd3hc1=Xl zqxQOb9}5@VVO!poM_J>}Rg)h>CzDDeqzX`+U;8~%{VFpu0t}m7JD7OUS*TZ^dmjS& zWl-V4oD4&L)RH?=)a`O3VBn#NPBLo)O>jm?(0p+HvV(i`$JPy~CLg;k)@;7#n@&V` z?X15&f8gNH#1Q`4scQLRQ}kln6DqIX-K`g{kGdEwgqC2Lcw0qQGuCySiyd#1VVuiu zmGcqFHkEtl5UX#75q`X!d{>Dxt~fKU#oBd5((|V8Elg#`>8nv$g-tL9oY46h~2V0S@Ax+O*|%d zd{6;z$eYS*oCqA3rS~`-A`M`HAV-MW4?Kp^dCDc7rC&>jDV+NHO4h&VJ+EZM=7`^# zB*^bsJS=Zdbjfd}w$C;f_u*@sE8fH$I6cMV3~G6g7+A9aEUj1ouBh-P>WlkG;%Y*Z zFXnUcyP~qWjkOElR%VNw8s9pb=~7p*Q4g5?Ue6|LZG7&(z7R*Sg5S+u)BT4dsxK9;0!*0&l=?%q}KUyuV5)qsIDWC zi~dNu;p#|@X(EcebxM*Qgi22>j%^=%01EQR%c<{xaUYvBYL&1pbpa)>L`v zPa5{isr;g0U>N*=ZP+jB^LNUFgHUW5I&6kGh$9FS6k*fyvT*nGXTufX{OZ#2_2m7J zCjv@~{_pSqS9s&=ZexqHO<)Ka4h#MJU=tM)5f)*yW&2kK1_R-^JN|vJ zx&Au?3PZs->h^mE!x^1_W-$>MBks82+sEXV-Ae#Hu^^<3jbRm|2`)QhyJl1PA>hK zfkpq!px{5&gTZ0{%)lTx^q^fq{_!dR|X=3!J`k|J9wOa>pLS9J literal 0 HcmV?d00001 diff --git a/figs/proc_bind_fig.png b/figs/proc_bind_fig.png new file mode 100644 index 0000000000000000000000000000000000000000..84206a620c31a70b07ce1af6f17f38dcad07e05b GIT binary patch literal 12942 zcmaKT1yEegwlyByCAd2Qf?IHRcXzkJ-QC?axRVeV++71f2ZBS;;F`>v+}!uw_v+RE z@2XyB_1>-f^z`o2RTHbKEQ5wjgbW1*g(fE}sSX7N;|}51h_Fyl(6Ot>{g4baKwU;0 zs&SU&2P6Y$Bc>z<1=W&_@@fVTu{EeFYDz)$#l^)Cgvi*~7z8ynH6h5#%8H1H2q9Wp zS`hpz$jEFHHgR{pg@kc*28f(8Z#5S*KvgJ5`gI0P{< zF(C+%y1Kf*grA@PFNuzhh7deFJacn%2oVwzf}n+k#b4{n$_fDi0fY++3&+RDLkJiQ zhM={zH3UUPMIk6ACbqG$0U^Z1#1OQ#wM|Y=PDx3DaEM4sO8zB(@%#7he~GlTG=!w5 zr#m@0{ZpW;tLrbPqM~wfae;6-Ik~K?ti8Rxf6Dwr+}+*#`uY?V6?1cQ|0?tH@{W#< zAe^3_URhZ=KR^Gk-qX_)1_nk&MFo;AC@Apq@){Z%f^b+^SXEV3Z*Ol1hl7JtQ&TG{ zD*9XHFT%sae`V77Q#8p#U0DMPJY)z)1W$p%9bik$MX=-B3-AUw8tefEQ|u*!1HcU6 zQ!qRDrWnlk0VhPjY8=gaZ@oXu1j$ua4*&&4 zfb}OqPtx6pKtZw1%Sno9`WT-FCR@2^7A2vf?BRdL$bt3WM!J= zOgRM(!dMxUO?O=1D#}*whfud(8IyFkSnu{d^4-d!c{~*9qdN6L5xB~hDN^gR7=(ahX%!l$+v&g^|;vpCC%l% ztFzZ+ieSp%=C{0)W$_g&sneIhjdlwC@7yU~jxQvat3e+E=I&QwlG~`I4=pM$h;9?% zp0=JszDrbM>wvmidxu0Le7zO#cZKhbix>H9{DTu>%7ne4-OlE`W&BsE^{l*`ZQ$-G zowMCu(B*K0`ZdoUnwd9b;6V;vWYF_t^{es15t79t6O>C7(Flr#tL@3^K=0hZN4EQk ztuu{4{IP~J4ASwMpGW6=MS8SQ*jAV47CztaTlb8qke~09Kzrq5vH}8w!TXsXER&Op zB=Syf+)_MbOl*c%`ee-TijMlpCg$TBZBC?W~pq}94YryiJla6DLav9F7xV)J-M#ryzgKvi)y17nN&OTDCI%uyA z)WeF0)}DrS;a>_Juv0=i{;Hb;1j6k@fe%cO62@1e6Ln=rPyFWZ+wt7)UNX)N)aqEv z5(KakUu4#z9(6X@#6EQrSo$Y65BM^cRfagI(|;1E1QcEj`5Kp`w?}0o5-hp3QDPg` zx%N5u8!hhxJ3IxM0?YL4ry{JtB-vtLJZ?_HM&44Q(Dt>%>yXLFHO_XV zA{M9AEVkuTFOCrMv|fluG_+sy$(p;-4PMISRUZw`)H%o`%->Z@#J5vPk1x?0lJgih zNmBo|-_1lUE`4f2FT*(|Z*LV(gxepJ&`i-G$MCUTDVUA=0L1-v$zQ)(oz2WAzG%Q6 zwS;@h$eJD9v(xQ8dB#G+nDUTtxMx&8r$zo%=qtQpq;&SZ4hBTDAHik%G6kXM>*# zbt&PEWo04&b*{uYiB+hm)c)ij#01t_(&ItqqNC0 zUM`!(1|@i37<8iu9Q#l!8_>u(+(Jj*4Y>R&h3Ao|_bdg)lQ)ZU_CC}?vPX$v&Hm*t z`DGGPlyA#z#E}b_A3tfq!!u#w0Oc$t++&MU^+j|umW=k2w{P)|qRJyTG6>E2FR&24!;wp#(wO46Z zz!!R_THimh7k5nnd9kB(2x`~wr}Zt>564H9J+38UGDT8sgDz*jg>T5&R0ed?z%=yf z5nNQLGw1$_w^fU<)IPM$J>O?Pa=>o!xdwWS+quk6{lM{#mCy!+2ynQKher-IpKa8T zaXBvtR=A=3I1Ey5wl<1U%lZmq26N!{nfTVH4;KHi6RUeFM3Ur6%oSnJMX1z|ICNC6 z^pU=u?~$!3i?HgAbH(+pL+Vei!LD)b!C$K|g{4C$oh}9?oE~d4OYX0Y=h*|F+r%sS8U*7Vq?0P5|>Fi9nObE;YM+a z2@9s#(-s}+*lx_|yGfToZfh>#i6*ppAI31l9S0*>BRksm)_aF6QXca)n|&`p7c<4P-+j+ZhW^#eywRM1(X2GOyek^M@VXd=cJFc9pTb+` zOK6BCYCJkFyeg76LDY9FEP2zp+DSCScOE7e-{V6LTrYab2og3l_$ST}FlFQxyXUxi zY8qg=E-2CO@ADHkh&Oxa^?Tf|O}wy6AI@ZcPr&Z8LkIV55|7Fu9yT`=aCnP zh&!^D1mjk7CQZ1)!ZA>`W=WwOymKKDYCeMJDEyoQ!w-mwrq-8EO((w0<&{W3n1y?k zgw9WdK^xr!#(V8HSvn-{-M~@XO|V2enj*q;?AZnuz0VfB8f~H1ttV*Kw&PL`Odyt* z#q`9Z#cr7+S1X9o&9boZC^{HVC^sD7i^dO?vB{Hy%4@X|pi$ybD+%R?rB&1|iEPzF zYvbqGTWyR(n0Z>nLyLpqs$QkrV^Y!D$I`d`@jiYsoM@{f&JeQ{1~oD{P7@a%6G^!J z=iLIqQ^p`5<1IXvdNp0*y$=gN8TIYzFoWr+*8U(OvaK!68u6d9G?WUzhsU}OVy>wv zh>*#s-tRHFn+=<=i;E9fuwXMWAg3t&q!)ssHBM8-EG=EJ%s*-lz-8Z~DWkH%3Jyb5 z`07Nbs)|dIjaVe@t0%5Nrh?>o0?S(JX2l=>$SbLv=FAxyRt7~yskeoL#b}|KG(Ud> z5>7vTjg5;9A<{`jp@!@|?HyMUyl_Jc8EC}sR*QFLL$P(f@|Yo zVrFN|MxBx@L7hHv38#pgjPkM&iHQ;xX~TVOF%^fGIy|8(uG1o$)yI4PX>*d({6XXR zDh1;taYq8cP^|pKhmZpp3#i&P_sPwikdft!e0WlnfAE5fQR}URUMr7!C3KYGbCqDo ziq<=;nb_J^4{~s>BQ;4A>^+%#x!$(0i6qzt5f-zh9SJ{GW0m`*2VFjX_GTA-tX(O- zql<3ec!`JBxUSM>-}6%fxo;&}hYCl}p&02xXhJz3NYt;;ko_nR)Cs`zu>081bE zNl5xjEV2R|&uO{R7KMebh$!%^2|K%p;;Ix$q!HM8=ZQXX%axPu8+`uoz-i|k$c`C* z5NR;4+bbgKCja7sx?EW}1k^iJdCf=PVH{c{^V&L^Z9Fz71Z3|59Cw8U(aTdh*xz)) z9a-?psM-lPdkK;sUf6)Y&QnS2Ki zOn~V6j%{o?M`#xVnMOHr`*i)F3g7wWTgxNdZ%3u7BksrYfeU*dfgd+BkM8y*NIP|# zgtuB|%1)*ccPwEtWnd2m5tCKKN`de%M`(kbRSl)nEiJ5(n4>XJ`Wa?$fkW7+5z|iy z7pE7v2B@+^Bgd~uKO!RX$L4yiLL=~YKy7{d-WrZ}djbz-kzeo));nf@&5IkL9Q9h3 zIt@l!34C|vd%#2SjP&k^TYKBI5kwuZvuLeh^B88wx+lUCh~t?4DWLyXR;0k-C9qhp z8u6&tuJrE8=Hdo_9l>KWLFrj|Kgb@UaeL5#XoMIKja~DDCr*eB+6sKsr#;o?AHLXU zE^-5q43P3G+u;rD)IJFK$+uA>0`RxcX%3gA1ObQn+%b5^l2WE>Z=TPp5n5p0PhZJM zd&c1ZTPM(3O=g5|j)hlmZ4>?ce{*O8kEg2iChPXB`=J4XEDVz7AIRbmV(WBDrN%L+ zQM`DLsY}wk5Yi=!85}X^v7e~#{GjC!9#741baR0pUiiIB%I!ybtfsFV>_Rl#v`2tQ zKUZqt1yAp=u1UEs9N@_gqwioaZs)Hmj@w{he#40n#8{$xT&80e8%;7H6`Uq-#`Z7) zWH)x2GT0=c=8IF0U<6+WuBn@#uNB$W2~RcvUC{&&Pk@(&W3tcMIVi|9P0B&uCZBy* zHl?Jt<1WxYe*03^fAK5c$WDw*4oNEhL~Y&-Sb%Z$GT{mHys@W$NHY>cz6re`S`tP? zXaQ4>Q)53ctNNYH9t|X>8jU_daLkN1PM%?bgBZdl{XMc_xx}hC-36!2sAC3|SywYT zEQ#eouCYovL}G;FFr(P$prNE}y5NvumGC6p#W)_bM@sZ)0v;J2`#1BNv1l~x8JX3x zg$`zl{uxrkt%KM=nIEnPBJI~8^+_ayZibNiYy2h7s;5UPI2TE=k))1USoCu2P6m%7 zqQmM-!#LW{$D$^sqH@e=7%|ectT`R@-vmpIq@X21ZDtZ4?4~eR!rr@Hp9dejL1w@@ zwe2K75w%Oe1BkMGMq)Ta6uw}u)SqH;?s$+u?K9_6G!+@p2w)`YfPXxN0(arFAPOZh zHBy=sq|W%Ri=sK$TgRVesFO_}GE4N9x(Hk7I$1OrJl}R?wPwyGn?w!qlBPCM5e5P^ z%%6^t4F7V50B0F|8I!wU?n}YTnL|_H%7?jvKDXk4`{OmXu0Cd5b>>t8?0qK0BPM;g z$?3KehZICOdnMzAGCxZJ;jwm4#9r{L!SgyCRbM^3ecJXZmn2opOSCGV#sZzHd83wz ztrSBl5?5|_p48pAN5HZ>w9Dah$pT6@h{=I~TG8|b(>8_0itoaW9(e;%9wq<>^8bvdogwrZrWnxZtuOCMpR zeZ*0uNL7PCzU4t0*R9ZNwT>f;YBw-T%5W(DJAPpAewp`=s4>5fY;8H)F0(5v(}g{= ziIx-J?S9M0JBX124z9JWmGOQ`VdwXG4E5{W-}wy%xty`?EZV#h)dYxTG@XP9EEnoT%7A^O&^T zL@DJh<)QwJ%h^=shvzs2^90M^f}G(3W2oV<-~IMLS1_|m2JBc@fl=x&Pp;6MRW@I- z68JsRpP)^`huV#1A6bXr9~>C5UL#Yz8lBXY3kei5>B4!1&MnYbapq7y{_=g2b@iUn z4(X+`p>qls_ZUS3W2zr6N&X-yF-(f$Qj*#XOQh)Gv^_!J3bUM7nJEXVn7ubi z63m#JDHrmHc>kfu1W5lJ!?#TCHsQ9SdbllKE%Z`oFz+;)qdN zf4t@4ej-{uY;8e|aN8L2KFr>;`nVACrS+BHTLT>fAPrp~%{P2-*S#j|fL_dbcnHgA z{G9#Urt^2CFulPgfCLw@p@)UCbj?<1F98}W+a8I@ z&$w{Yg06i&Z#qs9bH43DH%kj9PW-$)myjO0`9TLLrgxV=h{`a=H%6Y4cv+eFzf*Zk zEREo*$9&^O2$w=PNExu@!_jANM?d>D_E9&#pVxCf+Xd(ICH(w^836R0e#QadX!Ht| zd$2KvtVI<(bLsRA;o;FxfM*Pm_UzO)qwNN-xCY}wMLXj4zGWcEbWhNj_o+GX!UwysFoUX|pzv+{ry!_`KU-bwyU%AJ08~2nyZz6b_=@+QKa)dp1u7C@s1TRes=!Z+sTcp`&-6onUxz*M<$ z$V_uTemM~To!$*;PQx%1y8Tfq@xWEvV)rPe;E8m&fK8L&io?PBA?-(oBd7)i}Wt#qn0i~t@2q$ z{0i!#>L+N$oxTEE@}KhI*&#G^UK*Oo2iNrgc$QUnyX2gppm{ z1$U5VB@c5bL@ACNe$%C^kMh|bdNlITE z)iG7{OzKa{hem?})OX!#lT3c3k({RQDGiu|we~-Jgck}2iD8KqryIuhZUs<;)A%!6 zj9*DJaMG_px!`g^aaWK(H2l7`&K*8FCL248Es&}lEqLtQ@)*QMDSulYR^W`-S%P|2 z8jryU&F)6+`W8*inuGF>lp=kX2aM(&n|r?W4x^|*12)#)6(JmcSsW&4F9yDI0yWVd zE)Q3If$(#DleM5j;m?J10!P2w;oI@R9c|OUDjd1Xfe zo9?qTyAkp3P;q;|_3CT9tW=KvfQ%#CV+xXENR#JJyt3K(C)K5rpYRWzkv#o^g#peD z)E+aSY>*&6Q)ztI7yHpChlkq8&Vez=rBro^B=nnN$atsJ!fu5<5$NBV{qIx(zy{hHxS9?t6c_yxPJfL51JqK)XbU(cbqNh!t^n+G!iZga5mF@dJ z{XDxE%h~f#v|syQ0&Z`^OjOX$K!EC+#miHK?}4-MDVK0C;(3sh*+wu_=xciIyJ`Nh zh4>&jhxi2W<9K@ysf|su#JnkPiC!i;Y=xO4-T3%X1%d4);e%so zNC3+^jikgqW8iLq5~*#Bm2xX!W4wR>@jf&}>Wcbj*zQ9Y0GiOvN3}XSR}YsS=Yj8* zT?Gw*Jp|(o+6jF58r+z?P(KNe3=nSN%xJCh31hX5C>4e z%V92G5rc5YGv$m8A9{BB7&hqRWQ{*81^p)3|IF1>cr2%0G(uFdF?rhVGj$tkB>7pk zDIFB(0dK{FB8|TWqYrI!xM29%MdF1601Z~N6;WJ9+>e7N7|DyGi|w%MHzZ=4!N#73gE~b8M&adlv9F}W^w0Vn@=aM<$cXjl_|pi6@Virsr%Qt3 ze4587PYD+rgSOf`$Xos>2~>6H3+2)%>b2X6}^wpz0-#M zWgm5lJKmte!bAUfuXzS2PyExCdmzDYz!SGH{d<;XZIfA0W2d*<*EG{241-gY+$i0{ zRVHseVDw-r1KOG75cRI%yXO5csIq|GUkM#)P_miM-PCn4uAWxb_#=8*c$#wsY^vJL z0tiRXx~MXPZ&;@3jLGsN>`O{d(2h>BLLu#;H;AZ`Q_>#5_%oG+b69y~qv-N*YhZbd zu2X&7rBfX%=zlmDID~VAYm}OL9xo6TXhWdQsPISIbv!KjQ~$oDzcndz(T(`j9eSEH z8N}*@v&0d7Sdnk~t%`xO9pHBShPEJ>AimlH-T0%pq?5}xn9v&uZ2&YpW@w`405x&(hf*=XMnq#H5 zNt z8d`YCEtgXmnkxgpqbQLt8Vl48yyTG+y2nqHS~7kbewdo$oo)nRus(KD4tMkK*O`KeP**o zStF!h+CzD|e9CrbhYQx7{3o?zbJfcGygi`1@*J4Diy*5`gZ z8T*2+B3b0^(t9bps;16@|0DeTI|}{#F*EH%00~tQ|5xD5XEEel5@G}W1Sm`KV1u#) zG)THiBeAj9n}-h?LH*+I-gaG&T@+)Z3buCT*O(JJYg8HUy1!{*E237 zK4Ef;hwu*hX1iZZl_aSsE0k~&huILX2Zi{m2Z)v%UuqSM%npFn4BO^Y7HIV7KccK{ z(!hhMu9|^^#`>61(p=2*nT@~*eJ`1&#l)rnS%$#`JJ*y*Ql9b^=IvX_=cT#IyF#M8 zFV6NxBp3xaKBW2Vtds|N~l8m{u{$%?c3m1!x zZ(kZ1vc!H+ECmMC=_yrx_5WM}+$z*nsGGvGXyDeU3d9;8Vjz^VItZUY_0{I% zmM`f11Rcm`;ibA*V^+j}c@G6!AgVhR<=s#uGOa?+ZsQu)%m`g1^ z8`4T2%qRAJ)L^v(?D)H2u?O9XO_ z2Top8BlN|REVl$ckqL8iE6a=P-?x1cj8zzXi1?AUW>f>-njCaGo~$Pag`9;}&e+;1E4y9%pslxY%b3wE6!iFh>{?Ob)i-i(cG77}jxRSIT#V9FfHkk^b*c*e_btGs&T7rC z(PMd)L5*Zsn|1>t%pXh*7&J853aY4}&^`p?WUfiAg&?!Wm;=gz>a)RtwSeO&93aqL=;+&}TqAuy zBe`6m!w5mPDrdpQ!BuE}A^Pot;DXC!iSssSi5$d`Hr0^W0`g(*BGG^HSr8;X2{cvi zzHxIwkQq$f%oAh5PCh`GcAR}FUq;rMHA?c|<0o|&7Kys&^uMkY{mMvpqv3mNu188h>lWlnq8*1_kS5|Z1-pHlu|6a<|=8#Bk>2>nMy#9HU@WDA;P^}HZwIo^MaxT8SIrPD;Spv>oa<_l(cIg zSU4;9IP+5Mz78UamD{g}l_R0k@3szfhvzHv=wUA5lvt~-a_el}X7RFbwCKW`vr_IXrxeHMy-+*P*2aku9KC+&xg_w|P!}t+sYSK~uVck7 z>Roz>H9l8ivw61L@bWvcuZWW|0#8hKLYR?^ibQcW;)Gn?*)QHD#bb~olpFFrz*(8k zZpR&?a>DH$yg?7Z)V?l-HLVPBsjbk6wwm0ny;fbkgGSh=K#H4&Uz$yuns9gCeM4nV z#ah7{?No_)hx;&}5jG{JBRrXFd^yA4;5mmYUZdxoE}FS?!)XBTwO_0}Ip%V@YK&{_g1gyKx`u~ zepRcw?k!W8A(a<*%cMxM1_z)*YZN6Ca|=F*jFLj;@@MlUOqJjD ztLxT1P|LGMYn#q1(e}m-{zMBqbl2sf?fk z*7Hk6csohBP`8KUKOr5FDQdYovYcslv)yFBGNJB%`td&7-C(}JiM0wtqOZyAB--P} zXuZZTUa04KrdUbKUEMb!i+A!k0%S3>9qj2kT9=p|4+Iu4BJ3x43aprT_|5xomuCX$ z88l{fqr;gO`ckHfZK@7S_mI#?sR=ZaeR%}Ob-w*`;|L*_umMvhFtV~fRF8CQB7v*u z*w~HaZ1V@k&EXNAsfTes0eP$sWu!FqD6Kh%aeUpft-Y3SkQ}IH@R+wZXijmwQkvwfm*>tY%#>c4^!3U3^!v^e*Wt~@E2^Q-Rx5J3=4t{|l|D{oGt8lf` z$0IT2^ULL(>gZ{(wVn$u_=hK_4az)Nuj%0vM!-OlGnvV19KQW9`M_|~DkA=NQ~z$V zLsXwg#G_!=o%B^U`+lD;A7wun=DkSUPwg-Q32pt>tFyC*cLC|!Z(nO8abN=84tG26 zGz`m_Zp+hG3T6Jvh;+dOlUjcyc5m}}v*dWwkRlQi$ZQm}2j3;q`V(yzhkY*^UzuTB z!$5h4*YvwQFCiaJ@Z2D8OlH^Q%Nr9|Zm{`|6I@eYg9mdauSt9Vf%XN{CHYUva2H)4 z;sLEkdyE8%a4_%`jS6T;{l!wX!&BGSBM3|Z1l>^p4LL<;@TVpI`*kVw!z+m6V9Q~# zr{INC1FHGZsWrQC`R00r zctfPDZ$sufVOHF_`w#_Tp3y8vJ=~Oi^LVDI-Uk*hT3zkPkp{S_ymFju;)WQe{4C7G zb1o{Io2;}Yco}}Vg^mhGFL4`pAV)390gcpNR_hv4;l#mYwR=W7Zlb}YHN6L2Hgox; znzA~VGh=??e6C?*0@MGkXz?ws;BtMf)!%icY}xDv#{QnAnw{Q5J~tjc+7rw84J3ygo^g0AEYJMR6eMU}j+TUoGo4P(A1+{(7m#P!d=e z|F%lQy88CC6GYZ}@inUJB{WMbp+f=fs2=`&wSASTFds;AK7F7~jYJq2J=>gz#S%zg zSMFJ#7MG)s>Dc&Y_ls7Nds`7M|q%0{(oz>2EsHUR0vxsiqqkB2AXV4aDHBF+UKB@JA4$L%b zEgLkDF_=;++(XBG>D1z%l#7$rkg^^7pj?jZWL0B?AgSQM-7L4fwuUOa2U|+Jb+Bzt zrX{c%nw{j{{77koKjOSxji5}p6?k`Fg;_E!p5DlUy74t<{gErp)g; za5UOjQ+=mF;)}e7O~~_5!k2%&58GPAbJwo*g4SE}%@!2HSwU0Sd`Aoen1qWm>8D3T z$u7e$=9Y{4?64nZQSI4bc&tA$z`j=Y6QBGD(6B8kGW|_cU+TwB zrdB%`6=&6*hH_b8%?G|)JKahCrq3w{GNOY$yaQ&E z@4pt?f@W$hDPQeUqtiQjXfaul=E^B6nTL4v6bNrn}WH%?Tids~R`V((z35)9;i?& zYcr8x*By4!5boGk1Ksy!TJ3;=o{>liuawku`_8FX5_Edi!#E^es3YdIy=e|mor0#jZa7p7q^SsbwtMfAT==1wmRMQZ-;rd%%v$PybcYC+}X3%|JqQ?YpBelqt@s9trzOD$|ho(XY}Vy;Wi{-&a1x? z9=JPbyWJ2u8%vqoJ}aToWZyI=OdN=3Xg-#$xY$zw3!<$QSqaKM4ifYPX~0e#2(ehW z12JjwdXMk&iH_$Fb{F~&kyn+e-FaLX<&0ea?ATFp-FKIl0}ptYzkV607nRVJ#?JVV zu2>J#5yAYY)OuXNmD9t735l=J%h>D(dg&$lrBA@PBnJ+2PBiHJ_Kc6Le1A3>C8?mB z`#rEVt?%oMg>jm*Y_$bIigd+nxblCtmKWEdqEAVw3<5trL`4ws=`BQJ<=Z2!c303i8KacoWcx28GwjwW zV6)T>08JVjEyg&QJK4=O{*GwI0or5Ny|OQX783G8cDyx6joz9eSxGwlZJ<7+V^r-T z^N(>J6qtP#|fE$p_09wkF%ta9rH;;locP3pLSW6K|JJwQ~ zLZabk-*+L(hO@s~GBI~AH^Gm6Xh>Q-GD>BM0>A4HxIO-va{da;@$f;=J{dR>Z}$o; zeB8@P#7(o*yhgL0;Y#}7t^JLy)ivX`w*>(D;+8bmBACnHnZ{|2N)Q)vldf0}TmNqt z)}#NgpdBvN2npI|xl;}QTmSE14x6noK7ZzpM3^?^8N2U}CCj=(n>Hl{IbCGSvJ!;u wyBk4{9&rC())_P)+Q4E*onTw5`BjC`ugSZ^6vKbYOS*|j+O#+ zex1q9rOna4+umiWu!Xz8`TYDLg^u$0_>{!Rb+ftA=ID5}x`DdC*68YAr>(o%+>OA+ zCWw$hm!81f-*K_Gu+-Q7{{E1|$9=fH>htuN$IGhF)Z*{(7JrDK%g?vh+Wh_f@%Q-n z`}_U={w0Ty@AmiT^7G&A?{2TP?Dh4i&(i>NegFUesh-Q900009a7bBm000XU000XU z0RWnu7ytkO2XskIMF-vj1{W^@$2n$A000ZONkl?Y4I1|NpDk0|^P404jCccQYUMy0)fBZj;H(GlP{}*%X$U$*yE>gk@-^04jhA zpaQ5c0aO4LK!pjQ0;m8gOaK)?1<-#R=xu3ljgqjl>;SNFEBV4QH33ur6+i`0VFIWC zDu8}pYcBFU`vith9yo&^-ghsrM)?Gr6|a=X^8Xm#uJq5+Yl6 zy=nga-vjEfqxDS!&~f@aQ(Y`i0lK{JjvngI^_gBM|1h8uGhx4x9nh^AS4RR}b=#_B z+QF}H7y8{*`3C{D2h3-~?_tXdA?_FMWJ}pt%Y)w(~VW&5u~1ZQ_2eE0Gr!B9OB_zdg{6PK`Cb z2I%HC4(I|eLVH~SUN5@ghFX1lpbaV#G*1F*YwFH4&oYxd3jp*H-(PM4&)`#q&bMz0 zlyai8%}GE_B!k?1UO95CX90lXEp6~!nc50wxGNib1;Ta3G zj(Ns8NPK6;^4kHmX#sA;bD=r&B%rMB`@5e;+8lD|_L{0`-D6 zJ`Jef2Y_DlfT9!L9>ve%7h3pI`P*&zHnk}|VD}wPX6Zzr1z?HxI6z;~n^cpg@h3(V z|I0v&8i$5Mr8kT-Obhe|NXyq8pm`=z<(kK?0Kz`%9nCX5wV#i59WA}R-i_1NZ6$H3 z|H|K~yRp++cNqtCRAM>p^Ac)FT9s3QLV`e*0~7^B)8vJLvN$_9;7XEV7?!rja;1g4 zLe`3$gKIS!5-e<&5n79uv9tY$yDAdbw58HJALv4%{)^`_uxSLj41rEzph!EgQ)tLH z2JJo$`ziP0`}b;8g9Y`|qQM5xU1~%vl--r+V6*Yc13G)9RAhs`9I`(r1BL2%eHiGU z=sm>QE!sOP8YmE`**#{Fehxw1roRM%UfY0F{>TBEr|TRta$iIGr_ED=LLzk=2I@fh z8qd&S7Zh#+pv^8=WY8iWvdc@EwHE*=tZ7K^JfL(X?jcxM)LUA9`9z>gkC$aJK=JXF zuEb$bq38jq+r|4qHccCrwYNK%U)nJ$5uox%DK@PHfa=hJp+sD0>qMaII7O5O`Vp+T zr*tY(kGkPtg$9(L)}zPDyK-wW=ivT$2l+arJyEe!*(Y&vd&Ko`fj&@jgG*dWhA8T3s(N6r4QrZ8ryj$FZOUW&$a zXv-gXKJ~i$yIyvy__#N2V4x8vTA(5r{`sc74qV=L7+5QOi+kGIg?9ra-SbH6<^+qg3XR z3K<5fGUMjKEA##TMsWRX{}BaOw3;+fm6uiQ@(2hh?J(_bvggP@1J5$zLiDBST%msF$>oo2$T*w)o2@IFH4{uUMo)XSfE1)D73s$fLkMi zEx2ISC%hg8dIxm2*!WgKp!AvUmLuo>B153+k_&X40Z^u!i1fC@upX6zlZO$R&eqs1 z75#`N9H6ul-Ofm33QZXSRjCP6K$oX(`8ok~7+2M^LPza!G*6Ro%QbG7r+;r^XA1+J z)7r%{$Ef(30JZycC7nK$EU-Bs`IIjbK-=KR=U`=g;^}ir0?6&$5kO5~F;|`vfOaV- zI@DRQEeoJV6qUpWbc8yh6F}iwl#b63q)|DF4w^(P^cwbnjQvgm+N9)pX-bW_$^@wG zUu7PU@zB7$=H^47Wu9H9unudJ9xomD4;%avsov9N!%{yU zGt=yOht~I-B zA~$~#phybJy{E2uBKhBm0~Lx$=y>XVJv@8J{AM6#)$YOTlKxud`NObkS z9_R<`MBA4Hik0rfUT@?a%tsn1Sb|1%^6N0zGU2D3mifitWt9z3_?Zvfw{;nyFR1ZD zx{v+EYo)wkP32KtpLehUg4?ry3JQxi8SNBSaT1rdW*<@Pk7*7by5- zXYJBJ@o9tm1=%EC2I{*w)4SsphXZebdM0xp{2IV86CVn7#)kUhrGSRr^P3!~G{1yN zvil1FY8T;>FRF*4qVmQo^W>Hwnmrq6k0WDU7AVqMW=09sI8@8J}nbjNT`ZRB-DQAYE%L59jSPg*V0^g}G!s^k0f!c!eT zJ?N}#<&CI%aXwJii4sxW(Lf8PTAI7_Q-JzyCdpu0`CP^41Krq?(=YYZ@Sa`r zgj2$mW521rQmLcmfL(b$Q06N}2<`l6pz7RJt%7?JP+w1~RjKc=_+-Feb>`9)tx3$c z{ix0CfHKb)5Y_9Wfw~3PRk#111k``&#C`3^+XGL{TX&)0k9o3rz%5X$mwt9YnXhSj zI0L9Ra!Xdlt(*qb_q!^uW7oYcbLCOT?=r0HDLcNk2Cts0XD5zOX$o81IU4ALt5zJZ z=bs96i?o`9%KOi)7`=Jx09*9pwl!ExR#avWn4Nn+TcFoKb(#lsMm8Hjr~KS?-JX92 z(Cy6@s}?bBJEz?i;syNui82U32{-1O-3ld-@DESgJR->GLuYHlJ^-{lb@s1qu3a3I6DuOY z5&fdKx4(1uob*WSyI$*0tJO}UuKeZifof)Ql?=Z>)ZzEr{zE2!3ZMe004jhApx*~5 z?jxQ|*lyyhG&a(gRO-18wK(m`Ut^QQt?HAjY;1D+tteUi#jl`0Y)w3+7ys>P|6|MK zPpAd0EmHwBBcM65`|eOh7C^HD+7Unn&@6!(W9dvA2i0H_XxTgavOmNkjn|&EMAmFB zPc@$b>M#EhTSYDVz`i3grEG!r1<;IaYMWcLuLV$H0;m8gfC>{p1yBK0m;fq(3ZTLS iPyti`6+ne$WB&o{o8C{n)T1u|0000= this many chars +\righthyphenmin=60 % only hyphenate if the right part is >= this many chars + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Bulleted (itemized) lists +% Align bullets with section header +% Align text left +% Small bullets +% \compactitem for single-spaced lists (used in the Examples doc) + +\usepackage{enumitem} % for setting margins on lists +\setlist{leftmargin=*} % don't indent bullet items +\renewcommand{\labelitemi}{{\normalsize$\bullet$}} % bullet size + +% There is a \compactitem defined in package parlist (and perhaps others), however, +% we'll define our own version of compactitem in terms of package enumitem that +% we already use: +\newenvironment{compactitem} +{\begin{itemize}[itemsep=-1.2ex]} +{\end{itemize}} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Tables + +% This allows tables to flow across page breaks, headers on each new page, etc. +\usepackage{supertabular} +\usepackage{caption} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Line numbering + +\usepackage[pagewise]{lineno} % for line numbers on left side of the page +\pagewiselinenumbers +\setlength\linenumbersep{6em} +\renewcommand\linenumberfont{\normalfont\small\sffamily} +\nolinenumbers % start with line numbers off + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Footers + +\usepackage{fancyhdr} % makes right/left footers +\pagestyle{fancy} +\fancyhead{} % clear all header fields +\cfoot{} +\renewcommand{\headrulewidth}{0pt} + +% Left side on even pages: +% This requires that \footerText be defined in the master document: +\fancyfoot[LE]{\bfseries \thepage \mdseries \hspace{2em} \footerText} +\fancyhfoffset[E]{4em} + +% Right side on odd pages: +\fancyfoot[RO]{\mdseries \leftmark \hspace{2em} \bfseries \thepage} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Section header format - we use four levels: \chapter \section \subsection \subsubsection. + +\usepackage{titlesec} % format headers with \titleformat{} + +% Format and spacing for chapter, section, subsection, and subsubsection headers: + +\setcounter{secnumdepth}{4} % show numbers down to subsubsection level + +\titleformat{\chapter}[display]% +{\normalfont\sffamily\upshape\Huge\bfseries\fontsize{20}{20}\selectfont}% +{\normalfont\sffamily\scshape\large\bfseries \hspace{-0.7in} \MakeUppercase% + {\chaptertitlename} \thechapter}% +{0.8in}{}[\vspace{2ex}\hrule] +\titlespacing{\chapter}{0ex}{0em plus 1em minus 1em}{3em plus 1em minus 1em}[10em] + +\titleformat{\section}[hang]{\huge\bfseries\sffamily\fontsize{16}{16}\selectfont}{\thesection}{1.0em}{} +\titlespacing{\section}{-5em}{5em plus 1em minus 1em}{1em plus 0.5em minus 0em}[10em] + +\titleformat{\subsection}[hang]{\LARGE\bfseries\sffamily\fontsize{14}{14}\selectfont}{\thesubsection}{1.0em}{} +\titlespacing{\subsection}{-5em}{4em plus 1em minus 2.0em}{0.75em plus 0.5em minus 0em}[10em] + +\titleformat{\subsubsection}[hang]{\needspace{1\baselineskip}% +\Large\bfseries\sffamily\fontsize{12}{12}\selectfont}{\thesubsubsection}{1.0em}{} +\titlespacing{\subsubsection}{-5em}{3em plus 1em minus 1em}{0.5em plus 0.5em minus 0em}[10em] + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Macros for minor headers: Summary, Syntax, Description, etc. +% These headers are defined in terms of \paragraph + +\titleformat{\paragraph}[block]{\large\bfseries\sffamily\fontsize{11}{11}\selectfont}{}{}{} +\titlespacing{\paragraph}{0em}{1.5em plus 0.55em minus 0.5em}{0.0em plus 0.55em minus 0.0em} + +% Use one of the convenience macros below, or \littleheader{} for an arbitrary header +\newcommand{\littleheader}[1] {\paragraph*{#1}} + +\newcommand{\binding} {\littleheader{Binding}} +\newcommand{\comments} {\littleheader{Comments}} +\newcommand{\constraints} {\littleheader{Constraints on Arguments}} +\newcommand{\crossreferences} {\littleheader{Cross References}} +\newcommand{\descr} {\littleheader{Description}} +\newcommand{\effect} {\littleheader{Effect}} +\newcommand{\format} {\littleheader{Format}} +\newcommand{\restrictions} {\littleheader{Restrictions}} +\newcommand{\summary} {\littleheader{Summary}} +\newcommand{\syntax} {\littleheader{Syntax}} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Code and placeholder semantic tagging. +% +% When possible, prefer semantic tags instead of typographic tags. The +% following semantics tags are defined here: +% +% \code{} % for bold monospace keywords, code, operators, etc. +% \plc{} % for italic placeholder names, grammar, etc. +% +% For function prototypes or other code snippets, you can use \code{} as +% the outer wrapper, and use \plc{{} inside. Example: +% +% \code{\#pragma omp directive ( \plc{some-placeholder-identifier} :} +% +% To format text in italics for emphasis (rather than text as a placeholder), +% use the generic \emph{} command. Example: +% +% This sentence \emph{emphasizes some non-placeholder words}. + +% Enable \alltt{} for formatting blocks of code: +\usepackage{alltt} + +% This sets the default \code{} font to tt (monospace) and bold: +\newcommand{\code}[1]{{\texttt{\textbf{#1}}}} +\newcommand{\nspace}[1]{{\textrm{\textmd{ }}}} + +% This defines the \plc{} placeholder font to be tt normal slanted: +\newcommand{\plc}[1] {{\textrm{\textmd{\itshape{#1}}}}} + +% Environment for a paragraph of literal code, single-spaced, no outline, no indenting: +\newenvironment{codepar}[1] +{\begin{alltt}\bfseries #1} +{\end{alltt}} + +% For blocks of code inside a box frame: +\newenvironment{boxedcode}[1] +{\vspace{0.25em plus 5em minus 0.25em}\begin{framed}\begin{minipage}[t]{\textwidth}\begin{alltt}\bfseries #1} +{\end{alltt}\end{minipage}\end{framed}\vspace{0.25em plus 5em minus 0.25em}} + +% This sets the margins in the framed box: +\setlength{\FrameSep}{0.6em} + +% For indented lists of verbatim code at a relaxed line spacing, +% e.g., for use after "where clause is one of the following:" +\usepackage{setspace} +\newenvironment{indentedcodelist}{% + \begin{adjustwidth}{0.25in}{}\begin{spacing}{1.5}\begin{alltt}\bfseries} + {\end{alltt}\end{spacing}\vspace{-0.25\baselineskip}\end{adjustwidth}} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Macros for the black and blue lines and arrows delineating language-specific +% and notes sections. Example: +% +% \fortranspecificstart +% This is text that applies to Fortran. +% \fortranspecificend + +% local parameters for use \linewitharrows and \notelinewitharrows: +\newlength{\sbsz}\setlength{\sbsz}{0.05in} % size of arrows +\newlength{\sblw}\setlength{\sblw}{1.35pt} % line width (thickness) +\newlength{\sbtw} % text width +\newlength{\sblen} % total width of horizontal rule +\newlength{\sbht} % height of arrows +\newlength{\sbhadj} % vertical adjustment for aligning arrows with the line +\newlength{\sbns}\setlength{\sbns}{7\baselineskip} % arg for \needspace for downward arrows + +% \notelinewitharrows is a helper command that makes a black Note marker: +% arg 1 = 1 or -1 for up or down arrows +% arg 2 = solid or dashed or loosely dashed, etc. +\newcommand{\notelinewitharrows}[2]{% + \needspace{0.1\baselineskip}% + \vbox{\begin{tikzpicture}% + \setlength{\sblen}{\linewidth}% + \setlength{\sbht}{#1\sbsz}\setlength{\sbht}{1.4\sbht}% + \setlength{\sbhadj}{#1\sblw}\setlength{\sbhadj}{0.25\sbhadj}% + \filldraw (\sblen, 0) -- (\sblen - \sbsz, \sbht) -- (\sblen - 2\sbsz, 0) -- (\sblen, 0); + \draw[line width=\sblw, #2] (2\sbsz - \sblw, \sbhadj) -- (\sblen - 2\sbsz + \sblw, \sbhadj); + \filldraw (0, 0) -- (\sbsz, \sbht) -- (0 + 2\sbsz, 0) -- (0, 0); + \end{tikzpicture}}} + +% \linewitharrows is a helper command that makes a blue horizontal line, up or down arrows, and some text: +% arg 1 = 1 or -1 for up or down arrows +% arg 2 = solid or dashed or loosely dashed, etc. +% arg 3 = text +% arg 4 = text width +\newcommand{\linewitharrows}[4]{% + \needspace{0.1\baselineskip}% + \vbox to 1\baselineskip {\begin{tikzpicture}% + \setlength{\sbtw}{#4}% + \setlength{\sblen}{\linewidth}% + \setlength{\sbht}{#1\sbsz}\setlength{\sbht}{1.4\sbht}% + \setlength{\sbhadj}{#1\sblw}\setlength{\sbhadj}{0.25\sbhadj}% + \filldraw[color=blue!40] (\sblen, 0) -- (\sblen - \sbsz, \sbht) -- (\sblen - 2\sbsz, 0) -- (\sblen, 0); + \draw[line width=\sblw, color=blue!40, #2] (2\sbsz - \sblw, \sbhadj) -- (0.5\sblen - 0.5\sbtw, \sbhadj); + \draw[line width=\sblw, color=blue!40, #2] (0.5\sblen + 0.5\sbtw, \sbhadj) -- (\sblen - 2\sbsz + \sblw, \sbhadj); + \filldraw[color=blue!40] (0, 0) -- (\sbsz, \sbht) -- (0 + 2\sbsz, 0) -- (0, 0); + \node[color=blue!90] at (0.5\sblen, 0) {\large \textsf{\textup{#3}}}; + \end{tikzpicture}}} + +\newcommand{\VSPb}{\vspace{0.5ex plus 5ex minus 0.25ex}} +\newcommand{\VSPa}{\vspace{0.25ex plus 5ex minus 0.25ex}} + +% C +\newcommand{\cspecificstart}{\needspace{\sbns}\linewitharrows{-1}{solid}{C}{3em}} +\newcommand{\cspecificend}{\linewitharrows{1}{solid}{C}{3em}\bigskip} + +% C/C++ +\newcommand{\ccppspecificstart}{\VSPb\linewitharrows{-1}{solid}{C / C++}{6em}\VSPa} +\newcommand{\ccppspecificend}{\VSPb\linewitharrows{1}{solid}{C / C++}{6em}\VSPa} + +% C++ +\newcommand{\cppspecificstart}{\needspace{\sbns}\linewitharrows{-1}{solid}{C++}{6em}} +\newcommand{\cppspecificend}{\linewitharrows{1}{solid}{C++}{6em}\bigskip} + +% C90 +\newcommand{\cNinetyspecificstart}{\needspace{\sbns}\linewitharrows{-1}{solid}{C90}{4em}} +\newcommand{\cNinetyspecificend}{\linewitharrows{1}{solid}{C90}{4em}\bigskip} + +% C99 +\newcommand{\cNinetyNinespecificstart}{\needspace{\sbns}\linewitharrows{-1}{solid}{C99}{4em}} +\newcommand{\cNinetyNinespecificend}{\linewitharrows{1}{solid}{C99}{4em}\bigskip} + +% Fortran +\newcommand{\fortranspecificstart}{\VSPb\linewitharrows{-1}{solid}{Fortran}{6em}\VSPa} +\newcommand{\fortranspecificend}{\VSPb\linewitharrows{1}{solid}{Fortran}{6em}\VSPa} + +% Note +\newcommand{\notestart}{\VSPb\notelinewitharrows{-1}{solid}\VSPa} +\newcommand{\noteend}{\VSPb\notelinewitharrows{1}{solid}\VSPa} + +% convenience macro for formatting the word "Note:" at the beginning of note blocks: +\newcommand{\noteheader}{{\textrm{\textsf{\textbf\textup\normalsize{{{{Note }}}}}}}} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Glossary formatting + +\newcommand{\glossaryterm}[1]{\needspace{1ex} +\begin{adjustwidth}{-0.75in}{0.0in} +\nolinenumbers\parbox[b][-0.95\baselineskip][t]{1.4in}{\flushright \textbf{#1}} +\end{adjustwidth}\linenumbers} + +\newcommand{\glossarydefstart}{ +\begin{adjustwidth}{0.79in}{0.0in}} + +\newcommand{\glossarydefend}{ +\end{adjustwidth}\vspace{-1.5\baselineskip}} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Indexing and Table of Contents + +\usepackage{makeidx} +\usepackage[nodotinlabels]{titletoc} % required for its [nodotinlabels] option + +% Clickable links in TOC and index: +\usepackage[hyperindex=true,linktocpage=true]{hyperref} +\hypersetup{ + colorlinks = true, % Colors links instead of red boxes + urlcolor = blue, % Color for external links + linkcolor = blue % Color for internal links +} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Formats a cross reference label as "Section X on page Y". + +\newcommand{\specref}[1]{Section~\ref{#1} on page~\pageref{#1}} + + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Code example formatting for the Examples document +% This defines: +% /cexample formats blue markers, caption, and code for C/C++ examples +% /fexample formats blue markers, caption, and code for Fortran examples +% Thanks to Jin, Haoqiang H. for the original definitions of the following: + +\usepackage{color,fancyvrb} % for \VerbatimInput +\usepackage{toolbox} % for \toolboxMakeSplit + +\renewcommand\theFancyVerbLine{\normalfont\footnotesize\sffamily S-\arabic{FancyVerbLine}} + +\newcommand{\myreplace}[3]{\bgroup\toolboxMakeSplit*{#1}{DoSplit}% + \long\def\DoReplace##1{\DoSplit{##1}\lefttext\righttext + \lefttext + \toolboxIfElse{\ifx\righttext\undefined}{}% + {#2\expandafter\DoReplace\expandafter{\righttext}}}% + \DoReplace{#3}\egroup} + +\newcommand{\escstr}[1]{\myreplace{_}{\_}{#1}} + +\def\exampleheader#1#2{% + \ifthenelse{ \equal{#1}{} }{ + \def\cname{#2} + \def\ename\cname + }{ + \def\cname{#1.#2} +% Use following line for old numbering + \def\ename{\thechapter.#2} +% Use following for mneumonics +% \def\ename{\escstr{#1}.#2} + } + \noindent + \textit{Example \ename} + %\vspace*{-3mm} +} + +\def\cnexample#1#2{% + \exampleheader{#1}{#2} + \code{\VerbatimInput[numbers=left,numbersep=10ex,firstnumber=1,firstline=8,fontsize=\small]% + %\code{\VerbatimInput[numbers=left,firstnumber=1,firstline=8,fontsize=\small]% + %\code{\VerbatimInput[firstline=8,fontsize=\small]% + {sources/Example_\cname.c}} +} + +\def\fnexample#1#2{% + \exampleheader{#1}{#2} + \code{\VerbatimInput[numbers=left,numbersep=10ex,firstnumber=1,firstline=6,fontsize=\small]% + %\code{\VerbatimInput[numbers=left,firstnumber=1,firstline=6,fontsize=\small]% + %\code{\VerbatimInput[firstline=6,fontsize=\small]% + {sources/Example_\cname.f}} +} + +\newcommand\cexample[2]{% +\needspace{5\baselineskip}\ccppspecificstart +\cnexample{#1}{#2} +\ccppspecificend +} + +\newcommand\fexample[2]{% +\needspace{5\baselineskip}\fortranspecificstart +\fnexample{#1}{#2} +\fortranspecificend +} + + +% Set default fonts: +\rmfamily\mdseries\upshape\normalsize + + +% This is the end of openmp.sty of the OpenMP specification. diff --git a/sources/Example_affinity.1c.c b/sources/Example_affinity.1c.c new file mode 100644 index 0000000..8612024 --- /dev/null +++ b/sources/Example_affinity.1c.c @@ -0,0 +1,15 @@ +/* +* @@name: affinity.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +void work(); +void main() +{ +#pragma omp parallel proc_bind(spread) num_threads(4) + { + work(); + } +} diff --git a/sources/Example_affinity.1f.f b/sources/Example_affinity.1f.f new file mode 100644 index 0000000..dbed9e4 --- /dev/null +++ b/sources/Example_affinity.1f.f @@ -0,0 +1,10 @@ +! @@name: affinity.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + PROGRAM EXAMPLE +!$OMP PARALLEL PROC_BIND(SPREAD) NUM_THREADS(4) + CALL WORK() +!$OMP END PARALLEL + END PROGRAM EXAMPLE diff --git a/sources/Example_affinity.2c.c b/sources/Example_affinity.2c.c new file mode 100644 index 0000000..76445a5 --- /dev/null +++ b/sources/Example_affinity.2c.c @@ -0,0 +1,15 @@ +/* +* @@name: affinity.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void work(); +void foo() +{ + #pragma omp parallel num_threads(16) proc_bind(spread) + { + work(); + } +} diff --git a/sources/Example_affinity.2f.f b/sources/Example_affinity.2f.f new file mode 100644 index 0000000..322a347 --- /dev/null +++ b/sources/Example_affinity.2f.f @@ -0,0 +1,10 @@ +! @@name: affinity.2f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine foo +!$omp parallel num_threads(16) proc_bind(spread) + call work() +!$omp end parallel +end subroutine diff --git a/sources/Example_affinity.3c.c b/sources/Example_affinity.3c.c new file mode 100644 index 0000000..22e6bd1 --- /dev/null +++ b/sources/Example_affinity.3c.c @@ -0,0 +1,15 @@ +/* +* @@name: affinity.3c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +void work(); +void main() +{ +#pragma omp parallel proc_bind(close) num_threads(4) + { + work(); + } +} diff --git a/sources/Example_affinity.3f.f b/sources/Example_affinity.3f.f new file mode 100644 index 0000000..d07e433 --- /dev/null +++ b/sources/Example_affinity.3f.f @@ -0,0 +1,10 @@ +! @@name: affinity.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + PROGRAM EXAMPLE +!$OMP PARALLEL PROC_BIND(CLOSE) NUM_THREADS(4) + CALL WORK() +!$OMP END PARALLEL + END PROGRAM EXAMPLE diff --git a/sources/Example_affinity.4c.c b/sources/Example_affinity.4c.c new file mode 100644 index 0000000..5c07812 --- /dev/null +++ b/sources/Example_affinity.4c.c @@ -0,0 +1,15 @@ +/* +* @@name: affinity.4c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void work(); +void foo() +{ + #pragma omp parallel num_threads(16) proc_bind(close) + { + work(); + } +} diff --git a/sources/Example_affinity.4f.f b/sources/Example_affinity.4f.f new file mode 100644 index 0000000..3ef63c8 --- /dev/null +++ b/sources/Example_affinity.4f.f @@ -0,0 +1,10 @@ +! @@name: affinity.4f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine foo +!$omp parallel num_threads(16) proc_bind(close) + call work() +!$omp end parallel +end subroutine diff --git a/sources/Example_affinity.5c.c b/sources/Example_affinity.5c.c new file mode 100644 index 0000000..45d29de --- /dev/null +++ b/sources/Example_affinity.5c.c @@ -0,0 +1,15 @@ +/* +* @@name: affinity.5c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +void work(); +void main() +{ +#pragma omp parallel proc_bind(master) num_threads(4) + { + work(); + } +} diff --git a/sources/Example_affinity.5f.f b/sources/Example_affinity.5f.f new file mode 100644 index 0000000..417890b --- /dev/null +++ b/sources/Example_affinity.5f.f @@ -0,0 +1,10 @@ +! @@name: affinity.5f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + PROGRAM EXAMPLE +!$OMP PARALLEL PROC_BIND(MASTER) NUM_THREADS(4) + CALL WORK() +!$OMP END PARALLEL + END PROGRAM EXAMPLE diff --git a/sources/Example_array_sections.1c.c b/sources/Example_array_sections.1c.c new file mode 100644 index 0000000..1d810b1 --- /dev/null +++ b/sources/Example_array_sections.1c.c @@ -0,0 +1,19 @@ +/* +* @@name: array_sections.1c +* @@type: C +* @@compilable: no +* @@linkable: no +* @@expect: failure +*/ +void foo () +{ + int A[30]; +#pragma omp target data map( A[0:4] ) +{ + /* Cannot map distinct parts of the same array */ + #pragma omp target map( A[7:20] ) + { + A[2] = 0; + } +} +} diff --git a/sources/Example_array_sections.1f.f b/sources/Example_array_sections.1f.f new file mode 100644 index 0000000..161cf88 --- /dev/null +++ b/sources/Example_array_sections.1f.f @@ -0,0 +1,15 @@ +! @@name: array_sections.1f +! @@type: F-free +! @@compilable: no +! @@linkable: no +! @@expect: failure +subroutine foo() +integer :: A(30) + A = 1 + !$omp target data map( A(1:4) ) + ! Cannot map distinct parts of the same array + !$omp target map( A(8:27) ) + A(3) = 0 + !$omp end target map + !$omp end target data +end subroutine diff --git a/sources/Example_array_sections.2c.c b/sources/Example_array_sections.2c.c new file mode 100644 index 0000000..09c8822 --- /dev/null +++ b/sources/Example_array_sections.2c.c @@ -0,0 +1,23 @@ +/* +* @@name: array_sections.2c +* @@type: C +* @@compilable: no +* @@linkable: no +* @@expect: failure +*/ +void foo () +{ + int A[30], *p; +#pragma omp target data map( A[0:4] ) +{ + p = &A[0]; + /* invalid because p[3] and A[3] are the same + * location on the host but the array section + * specified via p[...] is not a subset of A[0:4] */ + #pragma omp target map( p[3:20] ) + { + A[2] = 0; + p[8] = 0; + } +} +} diff --git a/sources/Example_array_sections.2f.f b/sources/Example_array_sections.2f.f new file mode 100644 index 0000000..c61d1d3 --- /dev/null +++ b/sources/Example_array_sections.2f.f @@ -0,0 +1,20 @@ +! @@name: array_sections.2f +! @@type: F-free +! @@compilable: no +! @@linkable: no +! @@expect: failure +subroutine foo() +integer,target :: A(30) +integer,pointer :: p(:) + A=1 + !$omp target data map( A(1:4) ) + p=>A + ! invalid because p(4) and A(4) are the same + ! location on the host but the array section + ! specified via p(...) is not a subset of A(1:4) + !$omp target map( p(4:23) ) + A(3) = 0 + p(9) = 0 + !$omp end target + !$omp end target data +end subroutine diff --git a/sources/Example_array_sections.3c.c b/sources/Example_array_sections.3c.c new file mode 100644 index 0000000..4486628 --- /dev/null +++ b/sources/Example_array_sections.3c.c @@ -0,0 +1,20 @@ +/* +* @@name: array_sections.3c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void foo () +{ + int A[30], *p; +#pragma omp target data map( A[0:4] ) +{ + p = &A[0]; + #pragma omp target map( p[7:20] ) + { + A[2] = 0; + p[8] = 0; + } +} +} diff --git a/sources/Example_array_sections.3f.f b/sources/Example_array_sections.3f.f new file mode 100644 index 0000000..ac48140 --- /dev/null +++ b/sources/Example_array_sections.3f.f @@ -0,0 +1,16 @@ +! @@name: array_sections.3f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine foo() +integer,target :: A(30) +integer,pointer :: p(:) + !$omp target data map( A(1:4) ) + p=>A + !$omp target map( p(8:27) ) + A(3) = 0 + p(9) = 0 + !$omp end target map + !$omp end target data +end subroutine diff --git a/sources/Example_array_sections.4c.c b/sources/Example_array_sections.4c.c new file mode 100644 index 0000000..1147583 --- /dev/null +++ b/sources/Example_array_sections.4c.c @@ -0,0 +1,21 @@ +/* +* @@name: array_sections.4c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void foo () +{ + int A[30]; +#pragma omp target data map( A[0:10] ) +{ + p = &A[0]; + #pragma omp target map( p[3:7] ) + { + A[2] = 0; + p[8] = 0; + A[8] = 1; + } +} +} diff --git a/sources/Example_array_sections.4f.f b/sources/Example_array_sections.4f.f new file mode 100644 index 0000000..aa06f1c --- /dev/null +++ b/sources/Example_array_sections.4f.f @@ -0,0 +1,17 @@ +! @@name: array_sections.4f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine foo() +integer,target :: A(30) +integer,pointer :: p(:) + !$omp target data map( A(1:10) ) + p=>A + !$omp target map( p(4:10) ) + A(3) = 0 + p(9) = 0 + A(9) = 1 + !$omp end target + !$omp end target data +end subroutine diff --git a/sources/Example_associate.1f.f b/sources/Example_associate.1f.f new file mode 100644 index 0000000..745dc0b --- /dev/null +++ b/sources/Example_associate.1f.f @@ -0,0 +1,13 @@ +! @@name: associate.1f +! @@type: F-fixed +! @@compilable: no +! @@linkable: no +! @@expect: failure + program example + real :: a, c + associate (b => a) +!$omp parallel private(b, c) ! invalid to privatize b + c = 2.0*b +!$omp end parallel + end associate + end program diff --git a/sources/Example_associate.2f.f b/sources/Example_associate.2f.f new file mode 100644 index 0000000..deea829 --- /dev/null +++ b/sources/Example_associate.2f.f @@ -0,0 +1,15 @@ +! @@name: associate.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + program example + use omp_lib + integer i +!$omp parallel private(i) + i = omp_get_thread_num() + associate(thread_id => i) + print *, thread_id ! print private i value + end associate +!$omp end parallel + end program diff --git a/sources/Example_associate.3f.f b/sources/Example_associate.3f.f new file mode 100644 index 0000000..2d75291 --- /dev/null +++ b/sources/Example_associate.3f.f @@ -0,0 +1,16 @@ +! @@name: associate.3f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +program example + integer :: v + v = 15 +associate(u => v) +!$omp parallel private(v) + v = -1 + print *, v ! private v=-1 + print *, u ! original v=15 +!$omp end parallel +end associate +end program diff --git a/sources/Example_async_target.1c.c b/sources/Example_async_target.1c.c new file mode 100644 index 0000000..3313742 --- /dev/null +++ b/sources/Example_async_target.1c.c @@ -0,0 +1,28 @@ +/* +* @@name: async_target.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#pragma omp declare target +float F(float); +#pragma omp end declare target +#define N 1000000000 +#define CHUNKSZ 1000000 +void init(float *, int); +float Z[N]; +void pipedF() +{ + int C, i; + init(Z, N); + for (C=0; C +extern void init(float *, float *, int); +extern void output(float *, int); +void vec_mult(float *p, float *v1, float *v2, int N, int dev) +{ + int i; + init(p, N); + #pragma omp task depend(out: v1, v2) + #pragma omp target device(dev) map(v1, v2) + { + // check whether on device dev + if (omp_is_initial_device()) + abort(); + v1 = malloc(N*sizeof(float)); + v2 = malloc(N*sizeof(float)); + init(v1,v2); + } + foo(); // execute other work asychronously + #pragma omp task depend(in: v1, v2) + #pragma omp target device(dev) map(to: v1, v2) map(from: p[0:N]) + { + // check whether on device dev + if (omp_is_initial_device()) + abort(); + #pragma omp parallel for + for (i=0; iticketnumber); + while (atomic_read(&lock->turn) != myturn) + ; + // Do some work. The flush is needed to ensure visibility of + // variables not involved in atomic directives + +#pragma omp flush + work(); +#pragma omp flush + // Release the lock + fetch_and_add(&lock->turn); +} diff --git a/sources/Example_atomic.3f.f b/sources/Example_atomic.3f.f new file mode 100644 index 0000000..d71941d --- /dev/null +++ b/sources/Example_atomic.3f.f @@ -0,0 +1,50 @@ +! @@name: atomic.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + function fetch_and_add(p) + integer:: fetch_and_add + integer, intent(inout) :: p + +! Atomically read the value of p and then increment it. The previous value is +! returned. This can be used to implement a simple lock as shown below. +!$omp atomic capture + fetch_and_add = p + p = p + 1 +!$omp end atomic + end function fetch_and_add + module m + interface + function fetch_and_add(p) + integer :: fetch_and_add + integer, intent(inout) :: p + end function + function atomic_read(p) + integer :: atomic_read + integer, intent(in) :: p + end function + end interface + type locktype + integer ticketnumber + integer turn + end type + contains + subroutine do_locked_work(lock) + type(locktype), intent(inout) :: lock + integer myturn + integer junk +! obtain the lock + myturn = fetch_and_add(lock%ticketnumber) + do while (atomic_read(lock%turn) .ne. myturn) + continue + enddo +! Do some work. The flush is needed to ensure visibility of variables +! not involved in atomic directives +!$omp flush + call work +!$omp flush +! Release the lock + junk = fetch_and_add(lock%turn) + end subroutine + end module diff --git a/sources/Example_atomic_restrict.1c.c b/sources/Example_atomic_restrict.1c.c new file mode 100644 index 0000000..2b66ece --- /dev/null +++ b/sources/Example_atomic_restrict.1c.c @@ -0,0 +1,23 @@ +/* +* @@name: atomic_restrict.1c +* @@type: C +* @@compilable: maybe +* @@linkable: no +* @@expect: failure +*/ +void atomic_wrong () +{ + union {int n; float x;} u; + +#pragma omp parallel + { +#pragma omp atomic update + u.n++; + +#pragma omp atomic update + u.x += 1.0; + +/* Incorrect because the atomic constructs reference the same location + through incompatible types */ + } +} diff --git a/sources/Example_atomic_restrict.1f.f b/sources/Example_atomic_restrict.1f.f new file mode 100644 index 0000000..f4f5b45 --- /dev/null +++ b/sources/Example_atomic_restrict.1f.f @@ -0,0 +1,19 @@ +! @@name: atomic_restrict.1f +! @@type: F-fixed +! @@compilable: maybe +! @@linkable: no +! @@expect: failure + SUBROUTINE ATOMIC_WRONG() + INTEGER:: I + REAL:: R + EQUIVALENCE(I,R) + +!$OMP PARALLEL +!$OMP ATOMIC UPDATE + I = I + 1 +!$OMP ATOMIC UPDATE + R = R + 1.0 +! incorrect because I and R reference the same location +! but have different types +!$OMP END PARALLEL + END SUBROUTINE ATOMIC_WRONG diff --git a/sources/Example_atomic_restrict.2c.c b/sources/Example_atomic_restrict.2c.c new file mode 100644 index 0000000..b68b08e --- /dev/null +++ b/sources/Example_atomic_restrict.2c.c @@ -0,0 +1,29 @@ +/* +* @@name: atomic_restrict.2c +* @@type: C +* @@compilable: maybe +* @@linkable: no +* @@expect: failure +*/ +void atomic_wrong2 () +{ + int x; + int *i; + float *r; + + i = &x; + r = (float *)&x; + +#pragma omp parallel + { +#pragma omp atomic update + *i += 1; + +#pragma omp atomic update + *r += 1.0; + +/* Incorrect because the atomic constructs reference the same location + through incompatible types */ + + } +} diff --git a/sources/Example_atomic_restrict.2f.f b/sources/Example_atomic_restrict.2f.f new file mode 100644 index 0000000..8cf2008 --- /dev/null +++ b/sources/Example_atomic_restrict.2f.f @@ -0,0 +1,24 @@ +! @@name: atomic_restrict.2f +! @@type: F-fixed +! @@compilable: maybe +! @@linkable: no +! @@expect: failure + SUBROUTINE SUB() + COMMON /BLK/ R + REAL R + +!$OMP ATOMIC UPDATE + R = R + 1.0 + END SUBROUTINE SUB + + SUBROUTINE ATOMIC_WRONG2() + COMMON /BLK/ I + INTEGER I + +!$OMP PARALLEL + +!$OMP ATOMIC UPDATE + I = I + 1 + CALL SUB() +!$OMP END PARALLEL + END SUBROUTINE ATOMIC_WRONG2 diff --git a/sources/Example_atomic_restrict.3f.f b/sources/Example_atomic_restrict.3f.f new file mode 100644 index 0000000..e5659cd --- /dev/null +++ b/sources/Example_atomic_restrict.3f.f @@ -0,0 +1,25 @@ +! @@name: atomic_restrict.3f +! @@type: F-fixed +! @@compilable: maybe +! @@linkable: no +! @@expect: failure + SUBROUTINE ATOMIC_WRONG3 + INTEGER:: I + REAL:: R + EQUIVALENCE(I,R) + +!$OMP PARALLEL +!$OMP ATOMIC UPDATE + I = I + 1 +! incorrect because I and R reference the same location +! but have different types +!$OMP END PARALLEL + +!$OMP PARALLEL +!$OMP ATOMIC UPDATE + R = R + 1.0 +! incorrect because I and R reference the same location +! but have different types +!$OMP END PARALLEL + + END SUBROUTINE ATOMIC_WRONG3 diff --git a/sources/Example_barrier_regions.1c.c b/sources/Example_barrier_regions.1c.c new file mode 100644 index 0000000..47d13a4 --- /dev/null +++ b/sources/Example_barrier_regions.1c.c @@ -0,0 +1,40 @@ +/* +* @@name: barrier_regions.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +void work(int n) {} + +void sub3(int n) +{ + work(n); + #pragma omp barrier + work(n); +} + +void sub2(int k) +{ + #pragma omp parallel shared(k) + sub3(k); +} + +void sub1(int n) +{ + int i; + #pragma omp parallel private(i) shared(n) + { + #pragma omp for + for (i=0; ivalue == value) { + found = tree; + } + else { +#pragma omp task shared(found) if(level < 10) + { + binary_tree_t *found_left = NULL; + found_left = search_tree(tree->left, value, level + 1); + if (found_left) { +#pragma omp atomic write + found = found_left; +#pragma omp cancel taskgroup + } + } +#pragma omp task shared(found) if(level < 10) + { + binary_tree_t *found_right = NULL; + found_right = search_tree(tree->right, value, level + 1); + if (found_right) { +#pragma omp atomic write + found = found_right; +#pragma omp cancel taskgroup + } + } +#pragma omp taskwait + } + } + return found; +} +binary_tree_t *search_tree_parallel(binary_tree_t *tree, int value) { + binary_tree_t *found = NULL; +#pragma omp parallel shared(found, tree, value) + { +#pragma omp master + { +#pragma omp taskgroup + { + found = search_tree(tree, value, 0); + } + } + } + return found; +} diff --git a/sources/Example_cancellation.2f.f b/sources/Example_cancellation.2f.f new file mode 100644 index 0000000..e0c3c0c --- /dev/null +++ b/sources/Example_cancellation.2f.f @@ -0,0 +1,71 @@ +! @@name: cancellation.2f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +module parallel_search + type binary_tree + integer :: value + type(binary_tree), pointer :: right + type(binary_tree), pointer :: left + end type + +contains + recursive subroutine search_tree(tree, value, level, found) + type(binary_tree), intent(in), pointer :: tree + integer, intent(in) :: value, level + type(binary_tree), pointer :: found + type(binary_tree), pointer :: found_left => NULL(), & + found_right => NULL() + + if (.not. associated(found)) then + allocate(found) + endif + + if (associated(tree)) then + if (tree%value .eq. value) then + found = tree + else +!$omp task shared(found) if(level<10) + call search_tree(tree%left, value, level+1, found_left) + if (associated(found_left)) then +!$omp atomic write + found = found_left + +!$omp cancel taskgroup + endif +!$omp end task + +!$omp task shared(found) if(level<10) + call search_tree(tree%right, value, level+1, found_right) + if (associated(found_right)) then +!$omp atomic write + found = found_right + +!$omp cancel taskgroup + endif +!$omp end task + +!$omp taskwait + endif + endif + end subroutine + + subroutine search_tree_parallel(tree, value, found) + type(binary_tree), intent(in), pointer :: tree + integer, intent(in) :: value + type(binary_tree), pointer :: found + + if (associated(found)) then + allocate(found) + endif +!$omp parallel shared(found, tree, value) +!$omp master +!$omp taskgroup + call search_tree(tree, value, 0, found) +!$omp end taskgroup +!$omp end master +!$omp end parallel + end subroutine + +end module parallel_search diff --git a/sources/Example_carrays_fpriv.1c.c b/sources/Example_carrays_fpriv.1c.c new file mode 100644 index 0000000..b5d3990 --- /dev/null +++ b/sources/Example_carrays_fpriv.1c.c @@ -0,0 +1,38 @@ +/* +* @@name: carrays_fpriv.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include + +int A[2][2] = {1, 2, 3, 4}; + +void f(int n, int B[n][n], int C[]) +{ + int D[2][2] = {1, 2, 3, 4}; + int E[n][n]; + + assert(n >= 2); + E[1][1] = 4; + + #pragma omp parallel firstprivate(B, C, D, E) + { + assert(sizeof(B) == sizeof(int (*)[n])); + assert(sizeof(C) == sizeof(int*)); + assert(sizeof(D) == 4 * sizeof(int)); + assert(sizeof(E) == n * n * sizeof(int)); + + /* Private B and C have values of original B and C. */ + assert(&B[1][1] == &A[1][1]); + assert(&C[3] == &A[1][1]); + assert(D[1][1] == 4); + assert(E[1][1] == 4); + } +} + +int main() { + f(2, A, A[0]); + return 0; +} diff --git a/sources/Example_collapse.1c.c b/sources/Example_collapse.1c.c new file mode 100644 index 0000000..c066f3e --- /dev/null +++ b/sources/Example_collapse.1c.c @@ -0,0 +1,18 @@ +/* +* @@name: collapse.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void bar(float *a, int i, int j, int k); +int kl, ku, ks, jl, ju, js, il, iu,is; +void sub(float *a) +{ + int i, j, k; + #pragma omp for collapse(2) private(i, k, j) + for (k=kl; k<=ku; k+=ks) + for (j=jl; j<=ju; j+=js) + for (i=il; i<=iu; i+=is) + bar(a,i,j,k); +} diff --git a/sources/Example_collapse.1f.f b/sources/Example_collapse.1f.f new file mode 100644 index 0000000..8f297b5 --- /dev/null +++ b/sources/Example_collapse.1f.f @@ -0,0 +1,20 @@ +! @@name: collapse.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + subroutine sub(a) + real a(*) + integer kl, ku, ks, jl, ju, js, il, iu, is + common /csub/ kl, ku, ks, jl, ju, js, il, iu, is + integer i, j, k +!$omp do collapse(2) private(i,j,k) + do k = kl, ku, ks + do j = jl, ju, js + do i = il, iu, is + call bar(a,i,j,k) + enddo + enddo + enddo +!$omp end do + end subroutine diff --git a/sources/Example_collapse.2c.c b/sources/Example_collapse.2c.c new file mode 100644 index 0000000..7a06f42 --- /dev/null +++ b/sources/Example_collapse.2c.c @@ -0,0 +1,24 @@ +/* +* @@name: collapse.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +void test() +{ + int j, k, jlast, klast; + #pragma omp parallel + { + #pragma omp for collapse(2) lastprivate(jlast, klast) + for (k=1; k<=2; k++) + for (j=1; j<=3; j++) + { + jlast=j; + klast=k; + } + #pragma omp single + printf("%d %d\n", klast, jlast); + } +} diff --git a/sources/Example_collapse.2f.f b/sources/Example_collapse.2f.f new file mode 100644 index 0000000..6c7d12d --- /dev/null +++ b/sources/Example_collapse.2f.f @@ -0,0 +1,20 @@ +! @@name: collapse.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + program test +!$omp parallel +!$omp do private(j,k) collapse(2) lastprivate(jlast, klast) + do k = 1,2 + do j = 1,3 + jlast=j + klast=k + enddo + enddo +!$omp end do +!$omp single + print *, klast, jlast +!$omp end single +!$omp end parallel + end program test diff --git a/sources/Example_collapse.3c.c b/sources/Example_collapse.3c.c new file mode 100644 index 0000000..45b5e46 --- /dev/null +++ b/sources/Example_collapse.3c.c @@ -0,0 +1,26 @@ +/* +* @@name: collapse.3c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include +void work(int a, int j, int k); +void sub() +{ + int j, k, a; + #pragma omp parallel num_threads(2) + { + #pragma omp for collapse(2) ordered private(j,k) schedule(static,3) + for (k=1; k<=3; k++) + for (j=1; j<=2; j++) + { + #pragma omp ordered + printf("%d %d %d\n", omp_get_thread_num(), k, j); + /* end ordered */ + work(a,j,k); + } + } +} diff --git a/sources/Example_collapse.3f.f b/sources/Example_collapse.3f.f new file mode 100644 index 0000000..f1339a8 --- /dev/null +++ b/sources/Example_collapse.3f.f @@ -0,0 +1,20 @@ +! @@name: collapse.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + program test + include 'omp_lib.h' +!$omp parallel num_threads(2) +!$omp do collapse(2) ordered private(j,k) schedule(static,3) + do k = 1,3 + do j = 1,2 +!$omp ordered + print *, omp_get_thread_num(), k, j +!$omp end ordered + call work(a,j,k) + enddo + enddo +!$omp end do +!$omp end parallel + end program test diff --git a/sources/Example_cond_comp.1c.c b/sources/Example_cond_comp.1c.c new file mode 100644 index 0000000..fc6267e --- /dev/null +++ b/sources/Example_cond_comp.1c.c @@ -0,0 +1,18 @@ +/* +* @@name: cond_comp.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include + +int main() +{ + +# ifdef _OPENMP + printf("Compiled by an OpenMP-compliant implementation.\n"); +# endif + + return 0; +} diff --git a/sources/Example_cond_comp.1f.f b/sources/Example_cond_comp.1f.f new file mode 100644 index 0000000..0deaa06 --- /dev/null +++ b/sources/Example_cond_comp.1f.f @@ -0,0 +1,11 @@ +! @@name: cond_comp.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + PROGRAM EXAMPLE + +C234567890 +!$ PRINT *, "Compiled by an OpenMP-compliant implementation." + + END PROGRAM EXAMPLE diff --git a/sources/Example_copyin.1c.c b/sources/Example_copyin.1c.c new file mode 100644 index 0000000..76500ff --- /dev/null +++ b/sources/Example_copyin.1c.c @@ -0,0 +1,31 @@ +/* +* @@name: copyin.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include + +float* work; +int size; +float tol; + +#pragma omp threadprivate(work,size,tol) + +void build() +{ + int i; + work = (float*)malloc( sizeof(float)*size ); + for( i = 0; i < size; ++i ) work[i] = tol; +} + +void copyin_example( float t, int n ) +{ + tol = t; + size = n; + #pragma omp parallel copyin(tol,size) + { + build(); + } +} diff --git a/sources/Example_copyin.1f.f b/sources/Example_copyin.1f.f new file mode 100644 index 0000000..ecc1b71 --- /dev/null +++ b/sources/Example_copyin.1f.f @@ -0,0 +1,28 @@ +! @@name: copyin.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + MODULE M + REAL, POINTER, SAVE :: WORK(:) + INTEGER :: SIZE + REAL :: TOL +!$OMP THREADPRIVATE(WORK,SIZE,TOL) + END MODULE M + + SUBROUTINE COPYIN_EXAMPLE( T, N ) + USE M + REAL :: T + INTEGER :: N + TOL = T + SIZE = N +!$OMP PARALLEL COPYIN(TOL,SIZE) + CALL BUILD +!$OMP END PARALLEL + END SUBROUTINE COPYIN_EXAMPLE + + SUBROUTINE BUILD + USE M + ALLOCATE(WORK(SIZE)) + WORK = TOL + END SUBROUTINE BUILD diff --git a/sources/Example_copyprivate.1c.c b/sources/Example_copyprivate.1c.c new file mode 100644 index 0000000..adbe8a8 --- /dev/null +++ b/sources/Example_copyprivate.1c.c @@ -0,0 +1,17 @@ +/* +* @@name: copyprivate.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +float x, y; +#pragma omp threadprivate(x, y) + +void init(float a, float b ) { + #pragma omp single copyprivate(a,b,x,y) + { + scanf("%f %f %f %f", &a, &b, &x, &y); + } +} diff --git a/sources/Example_copyprivate.1f.f b/sources/Example_copyprivate.1f.f new file mode 100644 index 0000000..315a38d --- /dev/null +++ b/sources/Example_copyprivate.1f.f @@ -0,0 +1,15 @@ +! @@name: copyprivate.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE INIT(A,B) + REAL A, B + COMMON /XY/ X,Y +!$OMP THREADPRIVATE (/XY/) + +!$OMP SINGLE + READ (11) A,B,X,Y +!$OMP END SINGLE COPYPRIVATE (A,B,/XY/) + + END SUBROUTINE INIT diff --git a/sources/Example_copyprivate.2c.c b/sources/Example_copyprivate.2c.c new file mode 100644 index 0000000..c389b36 --- /dev/null +++ b/sources/Example_copyprivate.2c.c @@ -0,0 +1,36 @@ +/* +* @@name: copyprivate.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include + +float read_next( ) { + float * tmp; + float return_val; + + #pragma omp single copyprivate(tmp) + { + tmp = (float *) malloc(sizeof(float)); + } /* copies the pointer only */ + + + #pragma omp master + { + scanf("%f", tmp); + } + + #pragma omp barrier + return_val = *tmp; + #pragma omp barrier + + #pragma omp single nowait + { + free(tmp); + } + + return return_val; +} diff --git a/sources/Example_copyprivate.2f.f b/sources/Example_copyprivate.2f.f new file mode 100644 index 0000000..fa105a0 --- /dev/null +++ b/sources/Example_copyprivate.2f.f @@ -0,0 +1,24 @@ +! @@name: copyprivate.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + REAL FUNCTION READ_NEXT() + REAL, POINTER :: TMP + +!$OMP SINGLE + ALLOCATE (TMP) +!$OMP END SINGLE COPYPRIVATE (TMP) ! copies the pointer only + +!$OMP MASTER + READ (11) TMP +!$OMP END MASTER + +!$OMP BARRIER + READ_NEXT = TMP +!$OMP BARRIER + +!$OMP SINGLE + DEALLOCATE (TMP) +!$OMP END SINGLE NOWAIT + END FUNCTION READ_NEXT diff --git a/sources/Example_copyprivate.3c.c b/sources/Example_copyprivate.3c.c new file mode 100644 index 0000000..00f6b0b --- /dev/null +++ b/sources/Example_copyprivate.3c.c @@ -0,0 +1,23 @@ +/* +* @@name: copyprivate.3c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include +#include + +omp_lock_t *new_lock() +{ + omp_lock_t *lock_ptr; + + #pragma omp single copyprivate(lock_ptr) + { + lock_ptr = (omp_lock_t *) malloc(sizeof(omp_lock_t)); + omp_init_lock( lock_ptr ); + } + + return lock_ptr; +} diff --git a/sources/Example_copyprivate.3f.f b/sources/Example_copyprivate.3f.f new file mode 100644 index 0000000..1926a61 --- /dev/null +++ b/sources/Example_copyprivate.3f.f @@ -0,0 +1,14 @@ +! @@name: copyprivate.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + FUNCTION NEW_LOCK() + USE OMP_LIB ! or INCLUDE "omp_lib.h" + INTEGER(OMP_LOCK_KIND), POINTER :: NEW_LOCK + +!$OMP SINGLE + ALLOCATE(NEW_LOCK) + CALL OMP_INIT_LOCK(NEW_LOCK) +!$OMP END SINGLE COPYPRIVATE(NEW_LOCK) + END FUNCTION NEW_LOCK diff --git a/sources/Example_copyprivate.4f.f b/sources/Example_copyprivate.4f.f new file mode 100644 index 0000000..49b67b5 --- /dev/null +++ b/sources/Example_copyprivate.4f.f @@ -0,0 +1,25 @@ +! @@name: copyprivate.4f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE S(N) + INTEGER N + + REAL, DIMENSION(:), ALLOCATABLE :: A + REAL, DIMENSION(:), POINTER :: B + + ALLOCATE (A(N)) +!$OMP SINGLE + ALLOCATE (B(N)) + READ (11) A,B +!$OMP END SINGLE COPYPRIVATE(A,B) + ! Variable A is private and is + ! assigned the same value in each thread + ! Variable B is shared + +!$OMP BARRIER +!$OMP SINGLE + DEALLOCATE (B) +!$OMP END SINGLE NOWAIT + END SUBROUTINE S diff --git a/sources/Example_critical.1c.c b/sources/Example_critical.1c.c new file mode 100644 index 0000000..50b1d86 --- /dev/null +++ b/sources/Example_critical.1c.c @@ -0,0 +1,26 @@ +/* +* @@name: critical.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +int dequeue(float *a); +void work(int i, float *a); + +void critical_example(float *x, float *y) +{ + int ix_next, iy_next; + + #pragma omp parallel shared(x, y) private(ix_next, iy_next) + { + #pragma omp critical (xaxis) + ix_next = dequeue(x); + work(ix_next, x); + + #pragma omp critical (yaxis) + iy_next = dequeue(y); + work(iy_next, y); + } + +} diff --git a/sources/Example_critical.1f.f b/sources/Example_critical.1f.f new file mode 100644 index 0000000..921ee2d --- /dev/null +++ b/sources/Example_critical.1f.f @@ -0,0 +1,25 @@ +! @@name: critical.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE CRITICAL_EXAMPLE(X, Y) + + REAL X(*), Y(*) + INTEGER IX_NEXT, IY_NEXT + +!$OMP PARALLEL SHARED(X, Y) PRIVATE(IX_NEXT, IY_NEXT) + +!$OMP CRITICAL(XAXIS) + CALL DEQUEUE(IX_NEXT, X) +!$OMP END CRITICAL(XAXIS) + CALL WORK(IX_NEXT, X) + +!$OMP CRITICAL(YAXIS) + CALL DEQUEUE(IY_NEXT,Y) +!$OMP END CRITICAL(YAXIS) + CALL WORK(IY_NEXT, Y) + +!$OMP END PARALLEL + + END SUBROUTINE CRITICAL_EXAMPLE diff --git a/sources/Example_declare_target.1c.c b/sources/Example_declare_target.1c.c new file mode 100644 index 0000000..5a7c980 --- /dev/null +++ b/sources/Example_declare_target.1c.c @@ -0,0 +1,18 @@ +/* +* @@name: declare_target.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#pragma omp declare target +extern void fib(int N); +#pragma omp end declare target +#define THRESHOLD 1000000 +void fib_wrapper(int n) +{ + #pragma omp target if(n > THRESHOLD) + { + fib(n); + } +} diff --git a/sources/Example_declare_target.1f.f b/sources/Example_declare_target.1f.f new file mode 100644 index 0000000..ce0cf9c --- /dev/null +++ b/sources/Example_declare_target.1f.f @@ -0,0 +1,23 @@ +! @@name: declare_target.1f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +module module_fib +contains + subroutine fib(N) + integer :: N + !$omp declare target + !... + end subroutine +end module +module params +integer :: THRESHOLD=1000000 +end module +program my_fib +use params +use module_fib + !$omp target if( N > THRESHOLD ) + call fib(N) + !$omp end target +end program diff --git a/sources/Example_declare_target.2c.c b/sources/Example_declare_target.2c.c new file mode 100644 index 0000000..35bef88 --- /dev/null +++ b/sources/Example_declare_target.2c.c @@ -0,0 +1,28 @@ +/* +* @@name: declare_target.2c +* @@type: C++ +* @@compilable: no +* @@linkable: no +* @@expect: failure +*/ +struct typeX +{ + int a; +} +class typeY +{ + int foo() { return a^0x01;} + int a; +} +#pragma omp declare target +struct typeX varX; // ok +class typeY varY; // ok if varY.foo() not called on target device +#pragma omp end declare target +void foo() +{ + #pragma omp target + { + varX.a = 100; // ok + varY.foo(); // error foo() is not available on a target device + } +} diff --git a/sources/Example_declare_target.2f.f b/sources/Example_declare_target.2f.f new file mode 100644 index 0000000..2c95967 --- /dev/null +++ b/sources/Example_declare_target.2f.f @@ -0,0 +1,18 @@ +! @@name: declare_target.2f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +program my_fib +integer :: N = 8 +!$omp declare target(fib) + !$omp target + call fib(N) + !$omp end target +end program +subroutine fib(N) +integer :: N +!$omp declare target + print*,"hello from fib" + !... +end subroutine diff --git a/sources/Example_declare_target.3c.c b/sources/Example_declare_target.3c.c new file mode 100644 index 0000000..31bc938 --- /dev/null +++ b/sources/Example_declare_target.3c.c @@ -0,0 +1,25 @@ +/* +* @@name: declare_target.3c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#define N 1000 +#pragma omp declare target +float p[N], v1[N], v2[N]; +#pragma omp end declare target +extern void init(float *, float *, int); +extern void output(float *, int); +void vec_mult() +{ + int i; + init(v1, v2, N); + #pragma omp target update to(v1, v2) + #pragma omp target + #pragma omp parallel for + for (i=0; i +int x, y, z[1000]; +#pragma omp threadprivate(x) + +void default_none(int a) { + const int c = 1; + int i = 0; + + #pragma omp parallel default(none) private(a) shared(z) + { + int j = omp_get_num_threads(); + /* O.K. - j is declared within parallel region */ + a = z[j]; /* O.K. - a is listed in private clause */ + /* - z is listed in shared clause */ + x = c; /* O.K. - x is threadprivate */ + /* - c has const-qualified type */ + z[i] = y; /* Error - cannot reference i or y here */ + + #pragma omp for firstprivate(y) + /* Error - Cannot reference y in the firstprivate clause */ + for (i=0; i<10 ; i++) { + z[i] = i; /* O.K. - i is the loop iteration variable */ + } + + z[i] = y; /* Error - cannot reference i or y here */ + } +} diff --git a/sources/Example_default_none.1f.f b/sources/Example_default_none.1f.f new file mode 100644 index 0000000..5df13c1 --- /dev/null +++ b/sources/Example_default_none.1f.f @@ -0,0 +1,37 @@ +! @@name: default_none.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE DEFAULT_NONE(A) + INCLUDE "omp_lib.h" ! or USE OMP_LIB + + INTEGER A + + INTEGER X, Y, Z(1000) + COMMON/BLOCKX/X + COMMON/BLOCKY/Y + COMMON/BLOCKZ/Z +!$OMP THREADPRIVATE(/BLOCKX/) + + INTEGER I, J + i = 1 + +!$OMP PARALLEL DEFAULT(NONE) PRIVATE(A) SHARED(Z) PRIVATE(J) + J = OMP_GET_NUM_THREADS(); + ! O.K. - J is listed in PRIVATE clause + A = Z(J) ! O.K. - A is listed in PRIVATE clause + ! - Z is listed in SHARED clause + X = 1 ! O.K. - X is THREADPRIVATE + Z(I) = Y ! Error - cannot reference I or Y here + +!$OMP DO firstprivate(y) + ! Error - Cannot reference y in the firstprivate clause + DO I = 1,10 + Z(I) = I ! O.K. - I is the loop iteration variable + END DO + + + Z(I) = Y ! Error - cannot reference I or Y here +!$OMP END PARALLEL + END SUBROUTINE DEFAULT_NONE diff --git a/sources/Example_device.1c.c b/sources/Example_device.1c.c new file mode 100644 index 0000000..ced1e8f --- /dev/null +++ b/sources/Example_device.1c.c @@ -0,0 +1,43 @@ +/* +* @@name: device.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include +#pragma omp declare target +void vec_mult(float *p, float *v1, float *v2, int N); +extern float *p, *v1, *v2; +extern int N; +#pragma omp end declare target +extern void init_vars(float *, float *, int); +extern void output(float *, int); +void foo() +{ + N = init_vars(&p, &v1, &v2); + #pragma omp target device(42) map(p[:N], v1[:N], v2[:N]) + { + vec_mult(p, v1, v2, N); + } + output(p, N); +} +void vec_mult(float *p, float *v1, float *v2, int N) +{ + int i; + int nthreads = omp_is_initial_device() ? 8 : 1024; + if (!omp_is_initial_device()) + { + printf("1024 threads on target device\n"); + nthreads = 1024; + } + else + { + printf("8 threads on initial device\n"); + nthreads = 8; + } + #pragma omp parallel for private(i) num_threads(nthreads); + for (i=0; i +extern void init(float *, float *, int); +extern void output(float *, int); +void vec_mult(float *p, float *v1, float *v2, int N) +{ + int i; + init(v1, v2, N); + int ndev = omp_get_num_devices(); + int do_offload = (ndev>0 && N>1000000); + #pragma omp target if(do_offload) map(to: v1[0:N], v2[:N]) map(from: p[0:N]) + #pragma omp parallel for if(N>1000) private(i) + for (i=0; i0) .and. (N>1000000) + !$omp target if(do_offload) map(to: v1, v2) map(from: p) + !$omp parallel do if(N>1000) + do i=1,N + p(i) = v1(i) * v2(i) + end do + !$omp end target + call output(p, N) +end subroutine diff --git a/sources/Example_device.3c.c b/sources/Example_device.3c.c new file mode 100644 index 0000000..9782334 --- /dev/null +++ b/sources/Example_device.3c.c @@ -0,0 +1,17 @@ +/* +* @@name: device.3c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include +void foo(void) +{ + int default_device = omp_get_default_device(); + printf("Default device = %d\n", default_device); + omp_set_default_device(default_device+1); + if (omp_get_default_device() != default_device+1) + printf("Default device is still = %d\n", default_device); +} diff --git a/sources/Example_device.3f.f b/sources/Example_device.3f.f new file mode 100644 index 0000000..c9d787a --- /dev/null +++ b/sources/Example_device.3f.f @@ -0,0 +1,15 @@ +! @@name: device.3f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +program foo +use omp_lib, ONLY : omp_get_default_device, omp_set_default_device +integer :: old_default_device, new_default_device + old_default_device = omp_get_default_device() + print*, "Default device = ", old_default_device + new_default_device = old_default_device + 1 + call omp_set_default_device(new_default_device) + if (omp_get_default_device() == old_default_device) & + print*,"Default device is STILL = ", old_default_device +end program diff --git a/sources/Example_flush_nolist.1c.c b/sources/Example_flush_nolist.1c.c new file mode 100644 index 0000000..304deb9 --- /dev/null +++ b/sources/Example_flush_nolist.1c.c @@ -0,0 +1,58 @@ +/* +* @@name: flush_nolist.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +int x, *p = &x; + +void f1(int *q) +{ + *q = 1; + #pragma omp flush + /* x, p, and *q are flushed */ + /* because they are shared and accessible */ + /* q is not flushed because it is not shared. */ +} + +void f2(int *q) +{ + #pragma omp barrier + *q = 2; + #pragma omp barrier + + /* a barrier implies a flush */ + /* x, p, and *q are flushed */ + /* because they are shared and accessible */ + /* q is not flushed because it is not shared. */ +} + +int g(int n) +{ + int i = 1, j, sum = 0; + *p = 1; + #pragma omp parallel reduction(+: sum) num_threads(10) + { + f1(&j); + + /* i, n and sum were not flushed */ + /* because they were not accessible in f1 */ + /* j was flushed because it was accessible */ + sum += j; + + f2(&j); + + /* i, n, and sum were not flushed */ + /* because they were not accessible in f2 */ + /* j was flushed because it was accessible */ + sum += i + j + *p + n; + } + return sum; +} + +int main() +{ + int result = g(7); + return result; +} diff --git a/sources/Example_flush_nolist.1f.f b/sources/Example_flush_nolist.1f.f new file mode 100644 index 0000000..abd7db3 --- /dev/null +++ b/sources/Example_flush_nolist.1f.f @@ -0,0 +1,68 @@ +! @@name: flush_nolist.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + SUBROUTINE F1(Q) + COMMON /DATA/ X, P + INTEGER, TARGET :: X + INTEGER, POINTER :: P + INTEGER Q + + Q = 1 +!$OMP FLUSH + ! X, P and Q are flushed + ! because they are shared and accessible + END SUBROUTINE F1 + + SUBROUTINE F2(Q) + COMMON /DATA/ X, P + INTEGER, TARGET :: X + INTEGER, POINTER :: P + INTEGER Q + +!$OMP BARRIER + Q = 2 +!$OMP BARRIER + ! a barrier implies a flush + ! X, P and Q are flushed + ! because they are shared and accessible + END SUBROUTINE F2 + + INTEGER FUNCTION G(N) + COMMON /DATA/ X, P + INTEGER, TARGET :: X + INTEGER, POINTER :: P + INTEGER N + INTEGER I, J, SUM + + I = 1 + SUM = 0 + P = 1 +!$OMP PARALLEL REDUCTION(+: SUM) NUM_THREADS(10) + CALL F1(J) + ! I, N and SUM were not flushed + ! because they were not accessible in F1 + ! J was flushed because it was accessible + SUM = SUM + J + + CALL F2(J) + ! I, N, and SUM were not flushed + ! because they were not accessible in f2 + ! J was flushed because it was accessible + SUM = SUM + I + J + P + N +!$OMP END PARALLEL + + G = SUM + END FUNCTION G + + PROGRAM FLUSH_NOLIST + COMMON /DATA/ X, P + INTEGER, TARGET :: X + INTEGER, POINTER :: P + INTEGER RESULT, G + + P => X + RESULT = G(7) + PRINT *, RESULT + END PROGRAM FLUSH_NOLIST diff --git a/sources/Example_fort_do.1f.f b/sources/Example_fort_do.1f.f new file mode 100644 index 0000000..947d820 --- /dev/null +++ b/sources/Example_fort_do.1f.f @@ -0,0 +1,31 @@ +! @@name: fort_do.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WORK(I, J) + INTEGER I,J + END SUBROUTINE WORK + + SUBROUTINE DO_GOOD() + INTEGER I, J + REAL A(1000) + + DO 100 I = 1,10 +!$OMP DO + DO 100 J = 1,10 + CALL WORK(I,J) +100 CONTINUE ! !$OMP ENDDO implied here + +!$OMP DO + DO 200 J = 1,10 +200 A(I) = I + 1 +!$OMP ENDDO + +!$OMP DO + DO 300 I = 1,10 + DO 300 J = 1,10 + CALL WORK(I,J) +300 CONTINUE +!$OMP ENDDO + END SUBROUTINE DO_GOOD diff --git a/sources/Example_fort_do.2f.f b/sources/Example_fort_do.2f.f new file mode 100644 index 0000000..baa6f54 --- /dev/null +++ b/sources/Example_fort_do.2f.f @@ -0,0 +1,19 @@ +! @@name: fort_do.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WORK(I, J) + INTEGER I,J + END SUBROUTINE WORK + + SUBROUTINE DO_WRONG + INTEGER I, J + + DO 100 I = 1,10 +!$OMP DO + DO 100 J = 1,10 + CALL WORK(I,J) +100 CONTINUE +!$OMP ENDDO + END SUBROUTINE DO_WRONG diff --git a/sources/Example_fort_loopvar.1f.f b/sources/Example_fort_loopvar.1f.f new file mode 100644 index 0000000..dd7c55d --- /dev/null +++ b/sources/Example_fort_loopvar.1f.f @@ -0,0 +1,19 @@ +! @@name: fort_loopvar.1f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +SUBROUTINE PLOOP_1(A,N) +INCLUDE "omp_lib.h" ! or USE OMP_LIB + +REAL A(*) +INTEGER I, MYOFFSET, N + +!$OMP PARALLEL PRIVATE(MYOFFSET) + MYOFFSET = OMP_GET_THREAD_NUM()*N + DO I = 1, N + A(MYOFFSET+I) = FLOAT(I) + ENDDO +!$OMP END PARALLEL + +END SUBROUTINE PLOOP_1 diff --git a/sources/Example_fort_loopvar.2f.f b/sources/Example_fort_loopvar.2f.f new file mode 100644 index 0000000..8d7f408 --- /dev/null +++ b/sources/Example_fort_loopvar.2f.f @@ -0,0 +1,27 @@ +! @@name: fort_loopvar.2f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +SUBROUTINE PLOOP_2(A,B,N,I1,I2) +REAL A(*), B(*) +INTEGER I1, I2, N + +!$OMP PARALLEL SHARED(A,B,I1,I2) +!$OMP SECTIONS +!$OMP SECTION + DO I1 = I1, N + IF (A(I1).NE.0.0) EXIT + ENDDO +!$OMP SECTION + DO I2 = I2, N + IF (B(I2).NE.0.0) EXIT + ENDDO +!$OMP END SECTIONS +!$OMP SINGLE + IF (I1.LE.N) PRINT *, 'ITEMS IN A UP TO ', I1, 'ARE ALL ZERO.' + IF (I2.LE.N) PRINT *, 'ITEMS IN B UP TO ', I2, 'ARE ALL ZERO.' +!$OMP END SINGLE +!$OMP END PARALLEL + +END SUBROUTINE PLOOP_2 diff --git a/sources/Example_fort_race.1f.f b/sources/Example_fort_race.1f.f new file mode 100644 index 0000000..ba6e4b2 --- /dev/null +++ b/sources/Example_fort_race.1f.f @@ -0,0 +1,29 @@ +! @@name: fort_race.1f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: rt-error +SUBROUTINE SHARED_RACE + + INCLUDE "omp_lib.h" ! or USE OMP_LIB + + REAL A(20) + INTEGER MYTHREAD + +!$OMP PARALLEL SHARED(A) PRIVATE(MYTHREAD) + + MYTHREAD = OMP_GET_THREAD_NUM() + IF (MYTHREAD .EQ. 0) THEN + CALL SUB(A(1:10)) ! compiler may introduce writes to A(6:10) + ELSE + A(6:10) = 12 + ENDIF + +!$OMP END PARALLEL + +END SUBROUTINE SHARED_RACE + +SUBROUTINE SUB(X) + REAL X(*) + X(1:5) = 4 +END SUBROUTINE SUB diff --git a/sources/Example_fort_sa_private.1f.f b/sources/Example_fort_sa_private.1f.f new file mode 100644 index 0000000..c99d747 --- /dev/null +++ b/sources/Example_fort_sa_private.1f.f @@ -0,0 +1,18 @@ +! @@name: fort_sa_private.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: rt-error + SUBROUTINE SUB() + COMMON /BLOCK/ X + PRINT *,X ! X is undefined + END SUBROUTINE SUB + + PROGRAM PRIV_RESTRICT + COMMON /BLOCK/ X + X = 1.0 +!$OMP PARALLEL PRIVATE (X) + X = 2.0 + CALL SUB() +!$OMP END PARALLEL + END PROGRAM PRIV_RESTRICT diff --git a/sources/Example_fort_sa_private.2f.f b/sources/Example_fort_sa_private.2f.f new file mode 100644 index 0000000..284bef9 --- /dev/null +++ b/sources/Example_fort_sa_private.2f.f @@ -0,0 +1,24 @@ +! @@name: fort_sa_private.2f +! @@type: F-fixed +! @@compilable: maybe +! @@linkable: maybe +! @@expect: rt-error + PROGRAM PRIV_RESTRICT2 + COMMON /BLOCK2/ X + X = 1.0 + +!$OMP PARALLEL PRIVATE (X) + X = 2.0 + CALL SUB() +!$OMP END PARALLEL + + CONTAINS + + SUBROUTINE SUB() + COMMON /BLOCK2/ Y + + PRINT *,X ! X is undefined + PRINT *,Y ! Y is undefined + END SUBROUTINE SUB + + END PROGRAM PRIV_RESTRICT2 diff --git a/sources/Example_fort_sa_private.3f.f b/sources/Example_fort_sa_private.3f.f new file mode 100644 index 0000000..3f1e682 --- /dev/null +++ b/sources/Example_fort_sa_private.3f.f @@ -0,0 +1,15 @@ +! @@name: fort_sa_private.3f +! @@type: F-fixed +! @@compilable: maybe +! @@linkable: maybe +! @@expect: rt-error + PROGRAM PRIV_RESTRICT3 + EQUIVALENCE (X,Y) + X = 1.0 + +!$OMP PARALLEL PRIVATE(X) + PRINT *,Y ! Y is undefined + Y = 10 + PRINT *,X ! X is undefined +!$OMP END PARALLEL + END PROGRAM PRIV_RESTRICT3 diff --git a/sources/Example_fort_sa_private.4f.f b/sources/Example_fort_sa_private.4f.f new file mode 100644 index 0000000..5421ca4 --- /dev/null +++ b/sources/Example_fort_sa_private.4f.f @@ -0,0 +1,31 @@ +! @@name: fort_sa_private.4f +! @@type: F-fixed +! @@compilable: maybe +! @@linkable: maybe +! @@expect: rt-error + PROGRAM PRIV_RESTRICT4 + INTEGER I, J + INTEGER A(100), B(100) + EQUIVALENCE (A(51), B(1)) + +!$OMP PARALLEL DO DEFAULT(PRIVATE) PRIVATE(I,J) LASTPRIVATE(A) + DO I=1,100 + DO J=1,100 + B(J) = J - 1 + ENDDO + + DO J=1,100 + A(J) = J ! B becomes undefined at this point + ENDDO + + DO J=1,50 + B(J) = B(J) + 1 ! B is undefined + ! A becomes undefined at this point + ENDDO + ENDDO +!$OMP END PARALLEL DO ! The LASTPRIVATE write for A has + ! undefined results + + PRINT *, B ! B is undefined since the LASTPRIVATE + ! write of A was not defined + END PROGRAM PRIV_RESTRICT4 diff --git a/sources/Example_fort_sa_private.5f.f b/sources/Example_fort_sa_private.5f.f new file mode 100644 index 0000000..58fc92b --- /dev/null +++ b/sources/Example_fort_sa_private.5f.f @@ -0,0 +1,41 @@ +! @@name: fort_sa_private.5f +! @@type: F-fixed +! @@compilable: maybe +! @@linkable: maybe +! @@expect: rt-error + SUBROUTINE SUB1(X) + DIMENSION X(10) + + ! This use of X does not conform to the + ! specification. It would be legal Fortran 90, + ! but the OpenMP private directive allows the + ! compiler to break the sequence association that + ! A had with the rest of the common block. + + FORALL (I = 1:10) X(I) = I + END SUBROUTINE SUB1 + + PROGRAM PRIV_RESTRICT5 + COMMON /BLOCK5/ A + + DIMENSION B(10) + EQUIVALENCE (A,B(1)) + + ! the common block has to be at least 10 words + A = 0 + +!$OMP PARALLEL PRIVATE(/BLOCK5/) + + ! Without the private clause, + ! we would be passing a member of a sequence + ! that is at least ten elements long. + ! With the private clause, A may no longer be + ! sequence-associated. + + CALL SUB1(A) +!$OMP MASTER + PRINT *, A +!$OMP END MASTER + +!$OMP END PARALLEL + END PROGRAM PRIV_RESTRICT5 diff --git a/sources/Example_fort_sp_common.1f.f b/sources/Example_fort_sp_common.1f.f new file mode 100644 index 0000000..37724cc --- /dev/null +++ b/sources/Example_fort_sp_common.1f.f @@ -0,0 +1,16 @@ +! @@name: fort_sp_common.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE COMMON_GOOD() + COMMON /C/ X,Y + REAL X, Y + +!$OMP PARALLEL PRIVATE (/C/) + ! do work here +!$OMP END PARALLEL +!$OMP PARALLEL SHARED (X,Y) + ! do work here +!$OMP END PARALLEL + END SUBROUTINE COMMON_GOOD diff --git a/sources/Example_fort_sp_common.2f.f b/sources/Example_fort_sp_common.2f.f new file mode 100644 index 0000000..ba6b1de --- /dev/null +++ b/sources/Example_fort_sp_common.2f.f @@ -0,0 +1,22 @@ +! @@name: fort_sp_common.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE COMMON_GOOD2() + COMMON /C/ X,Y + REAL X, Y + INTEGER I +!$OMP PARALLEL +!$OMP DO PRIVATE(/C/) + DO I=1,1000 + ! do work here + ENDDO +!$OMP END DO +!$OMP DO PRIVATE(X) + DO I=1,1000 + ! do work here + ENDDO +!$OMP END DO +!$OMP END PARALLEL + END SUBROUTINE COMMON_GOOD2 diff --git a/sources/Example_fort_sp_common.3f.f b/sources/Example_fort_sp_common.3f.f new file mode 100644 index 0000000..da6a267 --- /dev/null +++ b/sources/Example_fort_sp_common.3f.f @@ -0,0 +1,14 @@ +! @@name: fort_sp_common.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE COMMON_GOOD3() + COMMON /C/ X,Y +!$OMP PARALLEL PRIVATE (/C/) + ! do work here +!$OMP END PARALLEL +!$OMP PARALLEL SHARED (/C/) + ! do work here +!$OMP END PARALLEL + END SUBROUTINE COMMON_GOOD3 diff --git a/sources/Example_fort_sp_common.4f.f b/sources/Example_fort_sp_common.4f.f new file mode 100644 index 0000000..2d631a1 --- /dev/null +++ b/sources/Example_fort_sp_common.4f.f @@ -0,0 +1,12 @@ +! @@name: fort_sp_common.4f +! @@type: F-fixed +! @@compilable: no +! @@linkable: no +! @@expect: failure + SUBROUTINE COMMON_WRONG() + COMMON /C/ X,Y +! Incorrect because X is a constituent element of C +!$OMP PARALLEL PRIVATE(/C/), SHARED(X) + ! do work here +!$OMP END PARALLEL + END SUBROUTINE COMMON_WRONG diff --git a/sources/Example_fort_sp_common.5f.f b/sources/Example_fort_sp_common.5f.f new file mode 100644 index 0000000..c9fecc6 --- /dev/null +++ b/sources/Example_fort_sp_common.5f.f @@ -0,0 +1,14 @@ +! @@name: fort_sp_common.5f +! @@type: F-fixed +! @@compilable: no +! @@linkable: no +! @@expect: failure + SUBROUTINE COMMON_WRONG2() + COMMON /C/ X,Y +! Incorrect: common block C cannot be declared both +! shared and private +!$OMP PARALLEL PRIVATE (/C/), SHARED(/C/) + ! do work here +!$OMP END PARALLEL + + END SUBROUTINE COMMON_WRONG2 diff --git a/sources/Example_fpriv_sections.1c.c b/sources/Example_fpriv_sections.1c.c new file mode 100644 index 0000000..b1454ef --- /dev/null +++ b/sources/Example_fpriv_sections.1c.c @@ -0,0 +1,32 @@ +/* +* @@name: fpriv_sections.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +#include +#define NT 4 +int main( ) { + int section_count = 0; + omp_set_dynamic(0); + omp_set_num_threads(NT); +#pragma omp parallel +#pragma omp sections firstprivate( section_count ) +{ +#pragma omp section + { + section_count++; + /* may print the number one or two */ + printf( "section_count %d\n", section_count ); + } +#pragma omp section + { + section_count++; + /* may print the number one or two */ + printf( "section_count %d\n", section_count ); + } +} + return 1; +} diff --git a/sources/Example_fpriv_sections.1f.f b/sources/Example_fpriv_sections.1f.f new file mode 100644 index 0000000..53aa6ae --- /dev/null +++ b/sources/Example_fpriv_sections.1f.f @@ -0,0 +1,24 @@ +! @@name: fpriv_sections.1f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +program section + use omp_lib + integer :: section_count = 0 + integer, parameter :: NT = 4 + call omp_set_dynamic(.false.) + call omp_set_num_threads(NT) +!$omp parallel +!$omp sections firstprivate ( section_count ) +!$omp section + section_count = section_count + 1 +! may print the number one or two + print *, 'section_count', section_count +!$omp section + section_count = section_count + 1 +! may print the number one or two + print *, 'section_count', section_count +!$omp end sections +!$omp end parallel +end program section diff --git a/sources/Example_get_nthrs.1c.c b/sources/Example_get_nthrs.1c.c new file mode 100644 index 0000000..4a8aef0 --- /dev/null +++ b/sources/Example_get_nthrs.1c.c @@ -0,0 +1,20 @@ +/* +* @@name: get_nthrs.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: rt-error +*/ +#include +void work(int i); + +void incorrect() +{ + int np, i; + + np = omp_get_num_threads(); /* misplaced */ + + #pragma omp parallel for schedule(static) + for (i=0; i < np; i++) + work(i); +} diff --git a/sources/Example_get_nthrs.1f.f b/sources/Example_get_nthrs.1f.f new file mode 100644 index 0000000..706ab0a --- /dev/null +++ b/sources/Example_get_nthrs.1f.f @@ -0,0 +1,21 @@ +! @@name: get_nthrs.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: rt-error + SUBROUTINE WORK(I) + INTEGER I + I = I + 1 + END SUBROUTINE WORK + + SUBROUTINE INCORRECT() + INCLUDE "omp_lib.h" ! or USE OMP_LIB + INTEGER I, NP + + NP = OMP_GET_NUM_THREADS() !misplaced: will return 1 +!$OMP PARALLEL DO SCHEDULE(STATIC) + DO I = 0, NP-1 + CALL WORK(I) + ENDDO +!$OMP END PARALLEL DO + END SUBROUTINE INCORRECT diff --git a/sources/Example_get_nthrs.2c.c b/sources/Example_get_nthrs.2c.c new file mode 100644 index 0000000..f4d4efb --- /dev/null +++ b/sources/Example_get_nthrs.2c.c @@ -0,0 +1,20 @@ +/* +* @@name: get_nthrs.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +void work(int i); + +void correct() +{ + int i; + + #pragma omp parallel private(i) + { + i = omp_get_thread_num(); + work(i); + } +} diff --git a/sources/Example_get_nthrs.2f.f b/sources/Example_get_nthrs.2f.f new file mode 100644 index 0000000..913f05f --- /dev/null +++ b/sources/Example_get_nthrs.2f.f @@ -0,0 +1,22 @@ +! @@name: get_nthrs.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WORK(I) + INTEGER I + + I = I + 1 + + END SUBROUTINE WORK + + SUBROUTINE CORRECT() + INCLUDE "omp_lib.h" ! or USE OMP_LIB + INTEGER I + +!$OMP PARALLEL PRIVATE(I) + I = OMP_GET_THREAD_NUM() + CALL WORK(I) +!$OMP END PARALLEL + + END SUBROUTINE CORRECT diff --git a/sources/Example_icv.1c.c b/sources/Example_icv.1c.c new file mode 100644 index 0000000..28f38b1 --- /dev/null +++ b/sources/Example_icv.1c.c @@ -0,0 +1,50 @@ +/* +* @@name: icv.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +#include + +int main (void) +{ + omp_set_nested(1); + omp_set_max_active_levels(8); + omp_set_dynamic(0); + omp_set_num_threads(2); + #pragma omp parallel + { + omp_set_num_threads(3); + + #pragma omp parallel + { + omp_set_num_threads(4); + #pragma omp single + { + /* + * The following should print: + * Inner: max_act_lev=8, num_thds=3, max_thds=4 + * Inner: max_act_lev=8, num_thds=3, max_thds=4 + */ + printf ("Inner: max_act_lev=%d, num_thds=%d, max_thds=%d\n", + omp_get_max_active_levels(), omp_get_num_threads(), + omp_get_max_threads()); + } + } + + #pragma omp barrier + #pragma omp single + { + /* + * The following should print: + * Outer: max_act_lev=8, num_thds=2, max_thds=3 + */ + printf ("Outer: max_act_lev=%d, num_thds=%d, max_thds=%d\n", + omp_get_max_active_levels(), omp_get_num_threads(), + omp_get_max_threads()); + } + } + return 0; +} diff --git a/sources/Example_icv.1f.f b/sources/Example_icv.1f.f new file mode 100644 index 0000000..247dffd --- /dev/null +++ b/sources/Example_icv.1f.f @@ -0,0 +1,38 @@ +! @@name: icv.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + program icv + use omp_lib + + call omp_set_nested(.true.) + call omp_set_max_active_levels(8) + call omp_set_dynamic(.false.) + call omp_set_num_threads(2) + +!$omp parallel + call omp_set_num_threads(3) + +!$omp parallel + call omp_set_num_threads(4) +!$omp single +! The following should print: +! Inner: max_act_lev= 8 , num_thds= 3 , max_thds= 4 +! Inner: max_act_lev= 8 , num_thds= 3 , max_thds= 4 + print *, "Inner: max_act_lev=", omp_get_max_active_levels(), + & ", num_thds=", omp_get_num_threads(), + & ", max_thds=", omp_get_max_threads() +!$omp end single +!$omp end parallel + +!$omp barrier +!$omp single +! The following should print: +! Outer: max_act_lev= 8 , num_thds= 2 , max_thds= 3 + print *, "Outer: max_act_lev=", omp_get_max_active_levels(), + & ", num_thds=", omp_get_num_threads(), + & ", max_thds=", omp_get_max_threads() +!$omp end single +!$omp end parallel + end diff --git a/sources/Example_init_lock.1c.c b/sources/Example_init_lock.1c.c new file mode 100644 index 0000000..68c1c5b --- /dev/null +++ b/sources/Example_init_lock.1c.c @@ -0,0 +1,21 @@ +/* +* @@name: init_lock.1c +* @@type: C++ +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include + +omp_lock_t *new_locks() +{ + int i; + omp_lock_t *lock = new omp_lock_t[1000]; + + #pragma omp parallel for private(i) + for (i=0; i<1000; i++) + { + omp_init_lock(&lock[i]); + } + return lock; +} diff --git a/sources/Example_init_lock.1f.f b/sources/Example_init_lock.1f.f new file mode 100644 index 0000000..7142e65 --- /dev/null +++ b/sources/Example_init_lock.1f.f @@ -0,0 +1,18 @@ +! @@name: init_lock.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + FUNCTION NEW_LOCKS() + USE OMP_LIB ! or INCLUDE "omp_lib.h" + INTEGER(OMP_LOCK_KIND), DIMENSION(1000) :: NEW_LOCKS + + INTEGER I + +!$OMP PARALLEL DO PRIVATE(I) + DO I=1,1000 + CALL OMP_INIT_LOCK(NEW_LOCKS(I)) + END DO +!$OMP END PARALLEL DO + + END FUNCTION NEW_LOCKS diff --git a/sources/Example_lastprivate.1c.c b/sources/Example_lastprivate.1c.c new file mode 100644 index 0000000..ce17512 --- /dev/null +++ b/sources/Example_lastprivate.1c.c @@ -0,0 +1,20 @@ +/* +* @@name: lastprivate.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void lastpriv (int n, float *a, float *b) +{ + int i; + + #pragma omp parallel + { + #pragma omp for lastprivate(i) + for (i=0; i +#include +#include + +int main() +{ + int x; + omp_lock_t lck; + + omp_init_lock (&lck); + omp_set_lock (&lck); + x = 0; + +#pragma omp parallel shared (x) + { + #pragma omp master + { + x = x + 1; + omp_unset_lock (&lck); + } + + /* Some more stuff. */ + } + omp_destroy_lock (&lck); + return 0; +} diff --git a/sources/Example_lock_owner.1f.f b/sources/Example_lock_owner.1f.f new file mode 100644 index 0000000..17310a5 --- /dev/null +++ b/sources/Example_lock_owner.1f.f @@ -0,0 +1,25 @@ +! @@name: lock_owner.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + program lock + use omp_lib + integer :: x + integer (kind=omp_lock_kind) :: lck + + call omp_init_lock (lck) + call omp_set_lock(lck) + x = 0 + +!$omp parallel shared (x) +!$omp master + x = x + 1 + call omp_unset_lock(lck) +!$omp end master + +! Some more stuff. +!$omp end parallel + + call omp_destroy_lock(lck) + end diff --git a/sources/Example_master.1c.c b/sources/Example_master.1c.c new file mode 100644 index 0000000..b11cb70 --- /dev/null +++ b/sources/Example_master.1c.c @@ -0,0 +1,42 @@ +/* +* @@name: master.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include + +extern float average(float,float,float); + +void master_example( float* x, float* xold, int n, float tol ) +{ + int c, i, toobig; + float error, y; + c = 0; + #pragma omp parallel + { + do{ + #pragma omp for private(i) + for( i = 1; i < n-1; ++i ){ + xold[i] = x[i]; + } + #pragma omp single + { + toobig = 0; + } + #pragma omp for private(i,y,error) reduction(+:toobig) + for( i = 1; i < n-1; ++i ){ + y = x[i]; + x[i] = average( xold[i-1], x[i], xold[i+1] ); + error = y - x[i]; + if( error > tol || error < -tol ) ++toobig; + } + #pragma omp master + { + ++c; + printf( "iteration %d, toobig=%d\n", c, toobig ); + } + }while( toobig > 0 ); + } +} diff --git a/sources/Example_master.1f.f b/sources/Example_master.1f.f new file mode 100644 index 0000000..e27a4c3 --- /dev/null +++ b/sources/Example_master.1f.f @@ -0,0 +1,36 @@ +! @@name: master.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE MASTER_EXAMPLE( X, XOLD, N, TOL ) + REAL X(*), XOLD(*), TOL + INTEGER N + INTEGER C, I, TOOBIG + REAL ERROR, Y, AVERAGE + EXTERNAL AVERAGE + C = 0 + TOOBIG = 1 +!$OMP PARALLEL + DO WHILE( TOOBIG > 0 ) +!$OMP DO PRIVATE(I) + DO I = 2, N-1 + XOLD(I) = X(I) + ENDDO +!$OMP SINGLE + TOOBIG = 0 +!$OMP END SINGLE +!$OMP DO PRIVATE(I,Y,ERROR), REDUCTION(+:TOOBIG) + DO I = 2, N-1 + Y = X(I) + X(I) = AVERAGE( XOLD(I-1), X(I), XOLD(I+1) ) + ERROR = Y-X(I) + IF( ERROR > TOL .OR. ERROR < -TOL ) TOOBIG = TOOBIG+1 + ENDDO +!$OMP MASTER + C = C + 1 + PRINT *, 'Iteration ', C, 'TOOBIG=', TOOBIG +!$OMP END MASTER + ENDDO +!$OMP END PARALLEL + END SUBROUTINE MASTER_EXAMPLE diff --git a/sources/Example_mem_model.1c.c b/sources/Example_mem_model.1c.c new file mode 100644 index 0000000..136f24c --- /dev/null +++ b/sources/Example_mem_model.1c.c @@ -0,0 +1,36 @@ +/* +* @@name: mem_model.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: rt-error +*/ +#include +#include + +int main(){ + int x; + + x = 2; + #pragma omp parallel num_threads(2) shared(x) + { + + if (omp_get_thread_num() == 0) { + x = 5; + } else { + /* Print 1: the following read of x has a race */ + printf("1: Thread# %d: x = %d\n", omp_get_thread_num(),x ); + } + + #pragma omp barrier + + if (omp_get_thread_num() == 0) { + /* Print 2 */ + printf("2: Thread# %d: x = %d\n", omp_get_thread_num(),x ); + } else { + /* Print 3 */ + printf("3: Thread# %d: x = %d\n", omp_get_thread_num(),x ); + } + } + return 0; +} diff --git a/sources/Example_mem_model.1f.f b/sources/Example_mem_model.1f.f new file mode 100644 index 0000000..8530dcc --- /dev/null +++ b/sources/Example_mem_model.1f.f @@ -0,0 +1,32 @@ +! @@name: mem_model.1f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: rt-error +PROGRAM MEMMODEL + INCLUDE "omp_lib.h" ! or USE OMP_LIB + INTEGER X + + X = 2 +!$OMP PARALLEL NUM_THREADS(2) SHARED(X) + + IF (OMP_GET_THREAD_NUM() .EQ. 0) THEN + X = 5 + ELSE + ! PRINT 1: The following read of x has a race + PRINT *,"1: THREAD# ", OMP_GET_THREAD_NUM(), "X = ", X + ENDIF + + !$OMP BARRIER + + IF (OMP_GET_THREAD_NUM() .EQ. 0) THEN + ! PRINT 2 + PRINT *,"2: THREAD# ", OMP_GET_THREAD_NUM(), "X = ", X + ELSE + ! PRINT 3 + PRINT *,"3: THREAD# ", OMP_GET_THREAD_NUM(), "X = ", X + ENDIF + +!$OMP END PARALLEL + +END PROGRAM MEMMODEL diff --git a/sources/Example_mem_model.2c.c b/sources/Example_mem_model.2c.c new file mode 100644 index 0000000..38e49ad --- /dev/null +++ b/sources/Example_mem_model.2c.c @@ -0,0 +1,48 @@ +/* +* @@name: mem_model.2c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: rt-error +*/ +#include +#include +int main() +{ + int data; + int flag=0; + #pragma omp parallel num_threads(2) + { + if (omp_get_thread_num()==0) + { + /* Write to the data buffer that will be + read by thread */ + data = 42; + /* Flush data to thread 1 and strictly order + the write to data + relative to the write to the flag */ + #pragma omp flush(flag, data) + /* Set flag to release thread 1 */ + flag = 1; + /* Flush flag to ensure that thread 1 sees + the change */ + #pragma omp flush(flag) + } + else if(omp_get_thread_num()==1) + { + /* Loop until we see the update to the flag */ + #pragma omp flush(flag, data) + while (flag < 1) + { + #pragma omp flush(flag, data) + } + /* Values of flag and data are undefined */ + printf("flag=%d data=%d\n", flag, data); + #pragma omp flush(flag, data) + /* Values data will be 42, value of flag + still undefined */ + printf("flag=%d data=%d\n", flag, data); + } + } + return 0; +} diff --git a/sources/Example_mem_model.2f.f b/sources/Example_mem_model.2f.f new file mode 100644 index 0000000..a612293 --- /dev/null +++ b/sources/Example_mem_model.2f.f @@ -0,0 +1,38 @@ +! @@name: mem_model.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: rt-error + PROGRAM EXAMPLE + INCLUDE "omp_lib.h" ! or USE OMP_LIB + INTEGER DATA + INTEGER FLAG + + FLAG = 0 + !$OMP PARALLEL NUM_THREADS(2) + IF(OMP_GET_THREAD_NUM() .EQ. 0) THEN + ! Write to the data buffer that will be read by thread 1 + DATA = 42 + ! Flush DATA to thread 1 and strictly order the write to DATA + ! relative to the write to the FLAG + !$OMP FLUSH(FLAG, DATA) + ! Set FLAG to release thread 1 + FLAG = 1; + ! Flush FLAG to ensure that thread 1 sees the change */ + !$OMP FLUSH(FLAG) + ELSE IF(OMP_GET_THREAD_NUM() .EQ. 1) THEN + ! Loop until we see the update to the FLAG + !$OMP FLUSH(FLAG, DATA) + DO WHILE(FLAG .LT. 1) + !$OMP FLUSH(FLAG, DATA) + ENDDO + + ! Values of FLAG and DATA are undefined + PRINT *, 'FLAG=', FLAG, ' DATA=', DATA + !$OMP FLUSH(FLAG, DATA) + + !Values DATA will be 42, value of FLAG still undefined */ + PRINT *, 'FLAG=', FLAG, ' DATA=', DATA + ENDIF + !$OMP END PARALLEL + END diff --git a/sources/Example_mem_model.3c.c b/sources/Example_mem_model.3c.c new file mode 100644 index 0000000..fe6659f --- /dev/null +++ b/sources/Example_mem_model.3c.c @@ -0,0 +1,50 @@ +/* +* @@name: mem_model.3c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: rt-error +*/ +#include +#include +int main() +{ + int flag=0; + + #pragma omp parallel num_threads(3) + { + if(omp_get_thread_num()==0) + { + /* Set flag to release thread 1 */ + #pragma omp atomic update + flag++; + /* Flush of flag is implied by the atomic directive */ + } + else if(omp_get_thread_num()==1) + { + /* Loop until we see that flag reaches 1*/ + #pragma omp flush(flag) + while(flag < 1) + { + #pragma omp flush(flag) + } + printf("Thread 1 awoken\n"); + + /* Set flag to release thread 2 */ + #pragma omp atomic update + flag++; + /* Flush of flag is implied by the atomic directive */ + } + else if(omp_get_thread_num()==2) + { + /* Loop until we see that flag reaches 2 */ + #pragma omp flush(flag) + while(flag < 2) + { + #pragma omp flush(flag) + } + printf("Thread 2 awoken\n"); + } + } + return 0; +} diff --git a/sources/Example_mem_model.3f.f b/sources/Example_mem_model.3f.f new file mode 100644 index 0000000..adfbcb4 --- /dev/null +++ b/sources/Example_mem_model.3f.f @@ -0,0 +1,40 @@ +! @@name: mem_model.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: rt-error + PROGRAM EXAMPLE + INCLUDE "omp_lib.h" ! or USE OMP_LIB + INTEGER FLAG + + FLAG = 0 + !$OMP PARALLEL NUM_THREADS(3) + IF(OMP_GET_THREAD_NUM() .EQ. 0) THEN + ! Set flag to release thread 1 + !$OMP ATOMIC UPDATE + FLAG = FLAG + 1 + !Flush of FLAG is implied by the atomic directive + ELSE IF(OMP_GET_THREAD_NUM() .EQ. 1) THEN + ! Loop until we see that FLAG reaches 1 + !$OMP FLUSH(FLAG, DATA) + DO WHILE(FLAG .LT. 1) + !$OMP FLUSH(FLAG, DATA) + ENDDO + + PRINT *, 'Thread 1 awoken' + + ! Set FLAG to release thread 2 + !$OMP ATOMIC UPDATE + FLAG = FLAG + 1 + !Flush of FLAG is implied by the atomic directive + ELSE IF(OMP_GET_THREAD_NUM() .EQ. 2) THEN + ! Loop until we see that FLAG reaches 2 + !$OMP FLUSH(FLAG, DATA) + DO WHILE(FLAG .LT. 2) + !$OMP FLUSH(FLAG, DATA) + ENDDO + + PRINT *, 'Thread 2 awoken' + ENDIF + !$OMP END PARALLEL + END diff --git a/sources/Example_nestable_lock.1c.c b/sources/Example_nestable_lock.1c.c new file mode 100644 index 0000000..c9b2655 --- /dev/null +++ b/sources/Example_nestable_lock.1c.c @@ -0,0 +1,46 @@ +/* +* @@name: nestable_lock.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +typedef struct { + int a,b; + omp_nest_lock_t lck; } pair; + +int work1(); +int work2(); +int work3(); +void incr_a(pair *p, int a) +{ + /* Called only from incr_pair, no need to lock. */ + p->a += a; +} +void incr_b(pair *p, int b) +{ + /* Called both from incr_pair and elsewhere, */ + /* so need a nestable lock. */ + + omp_set_nest_lock(&p->lck); + p->b += b; + omp_unset_nest_lock(&p->lck); +} +void incr_pair(pair *p, int a, int b) +{ + omp_set_nest_lock(&p->lck); + incr_a(p, a); + incr_b(p, b); + omp_unset_nest_lock(&p->lck); +} +void nestlock(pair *p) +{ + #pragma omp parallel sections + { + #pragma omp section + incr_pair(p, work1(), work2()); + #pragma omp section + incr_b(p, work3()); + } +} diff --git a/sources/Example_nestable_lock.1f.f b/sources/Example_nestable_lock.1f.f new file mode 100644 index 0000000..41a3198 --- /dev/null +++ b/sources/Example_nestable_lock.1f.f @@ -0,0 +1,63 @@ +! @@name: nestable_lock.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + MODULE DATA + USE OMP_LIB, ONLY: OMP_NEST_LOCK_KIND + TYPE LOCKED_PAIR + INTEGER A + INTEGER B + INTEGER (OMP_NEST_LOCK_KIND) LCK + END TYPE + END MODULE DATA + + SUBROUTINE INCR_A(P, A) + ! called only from INCR_PAIR, no need to lock + USE DATA + TYPE(LOCKED_PAIR) :: P + INTEGER A + P%A = P%A + A + END SUBROUTINE INCR_A + + SUBROUTINE INCR_B(P, B) + ! called from both INCR_PAIR and elsewhere, + ! so we need a nestable lock + USE OMP_LIB ! or INCLUDE "omp_lib.h" + USE DATA + TYPE(LOCKED_PAIR) :: P + INTEGER B + CALL OMP_SET_NEST_LOCK(P%LCK) + P%B = P%B + B + CALL OMP_UNSET_NEST_LOCK(P%LCK) + END SUBROUTINE INCR_B + + SUBROUTINE INCR_PAIR(P, A, B) + USE OMP_LIB ! or INCLUDE "omp_lib.h" + USE DATA + TYPE(LOCKED_PAIR) :: P + INTEGER A + INTEGER B + + CALL OMP_SET_NEST_LOCK(P%LCK) + CALL INCR_A(P, A) + CALL INCR_B(P, B) + CALL OMP_UNSET_NEST_LOCK(P%LCK) + END SUBROUTINE INCR_PAIR + + SUBROUTINE NESTLOCK(P) + USE OMP_LIB ! or INCLUDE "omp_lib.h" + USE DATA + TYPE(LOCKED_PAIR) :: P + INTEGER WORK1, WORK2, WORK3 + EXTERNAL WORK1, WORK2, WORK3 + +!$OMP PARALLEL SECTIONS + +!$OMP SECTION + CALL INCR_PAIR(P, WORK1(), WORK2()) +!$OMP SECTION + CALL INCR_B(P, WORK3()) +!$OMP END PARALLEL SECTIONS + + END SUBROUTINE NESTLOCK diff --git a/sources/Example_nested_loop.1c.c b/sources/Example_nested_loop.1c.c new file mode 100644 index 0000000..c8419fb --- /dev/null +++ b/sources/Example_nested_loop.1c.c @@ -0,0 +1,25 @@ +/* +* @@name: nested_loop.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void work(int i, int j) {} + +void good_nesting(int n) +{ + int i, j; + #pragma omp parallel default(shared) + { + #pragma omp for + for (i=0; i + +void nowait_example(int n, int m, float *a, float *b, float *y, float *z) +{ + int i; + #pragma omp parallel + { + #pragma omp for nowait + for (i=1; i +void nowait_example2(int n, float *a, float *b, float *c, float *y, float +*z) +{ + int i; +#pragma omp parallel + { +#pragma omp for schedule(static) nowait + for (i=0; i +int main() +{ + omp_set_dynamic(0); + #pragma omp parallel num_threads(10) + { + /* do work here */ + } + return 0; +} diff --git a/sources/Example_nthrs_dynamic.1f.f b/sources/Example_nthrs_dynamic.1f.f new file mode 100644 index 0000000..614f9b7 --- /dev/null +++ b/sources/Example_nthrs_dynamic.1f.f @@ -0,0 +1,12 @@ +! @@name: nthrs_dynamic.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + PROGRAM EXAMPLE + INCLUDE "omp_lib.h" ! or USE OMP_LIB + CALL OMP_SET_DYNAMIC(.FALSE.) +!$OMP PARALLEL NUM_THREADS(10) + ! do work here +!$OMP END PARALLEL + END PROGRAM EXAMPLE diff --git a/sources/Example_nthrs_dynamic.2c.c b/sources/Example_nthrs_dynamic.2c.c new file mode 100644 index 0000000..48bd8d1 --- /dev/null +++ b/sources/Example_nthrs_dynamic.2c.c @@ -0,0 +1,17 @@ +/* +* @@name: nthrs_dynamic.2c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +int main() +{ + omp_set_dynamic(1); + #pragma omp parallel num_threads(10) + { + /* do work here */ + } + return 0; +} diff --git a/sources/Example_nthrs_dynamic.2f.f b/sources/Example_nthrs_dynamic.2f.f new file mode 100644 index 0000000..00a3eab --- /dev/null +++ b/sources/Example_nthrs_dynamic.2f.f @@ -0,0 +1,12 @@ +! @@name: nthrs_dynamic.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + PROGRAM EXAMPLE + INCLUDE "omp_lib.h" ! or USE OMP_LIB + CALL OMP_SET_DYNAMIC(.TRUE.) +!$OMP PARALLEL NUM_THREADS(10) + ! do work here +!$OMP END PARALLEL + END PROGRAM EXAMPLE diff --git a/sources/Example_nthrs_nesting.1c.c b/sources/Example_nthrs_nesting.1c.c new file mode 100644 index 0000000..967f252 --- /dev/null +++ b/sources/Example_nthrs_nesting.1c.c @@ -0,0 +1,58 @@ +/* +* @@name: nthrs_nesting.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +#include +int main (void) +{ + omp_set_nested(1); + omp_set_dynamic(0); + #pragma omp parallel + { + #pragma omp parallel + { + #pragma omp single + { + /* + * If OMP_NUM_THREADS=2,3 was set, the following should print: + * Inner: num_thds=3 + * Inner: num_thds=3 + * + * If nesting is not supported, the following should print: + * Inner: num_thds=1 + * Inner: num_thds=1 + */ + printf ("Inner: num_thds=%d\n", omp_get_num_threads()); + } + } + #pragma omp barrier + omp_set_nested(0); + #pragma omp parallel + { + #pragma omp single + { + /* + * Even if OMP_NUM_THREADS=2,3 was set, the following should + * print, because nesting is disabled: + * Inner: num_thds=1 + * Inner: num_thds=1 + */ + printf ("Inner: num_thds=%d\n", omp_get_num_threads()); + } + } + #pragma omp barrier + #pragma omp single + { + /* + * If OMP_NUM_THREADS=2,3 was set, the following should print: + * Outer: num_thds=2 + */ + printf ("Outer: num_thds=%d\n", omp_get_num_threads()); + } + } + return 0; +} diff --git a/sources/Example_nthrs_nesting.1f.f b/sources/Example_nthrs_nesting.1f.f new file mode 100644 index 0000000..463af89 --- /dev/null +++ b/sources/Example_nthrs_nesting.1f.f @@ -0,0 +1,40 @@ +! @@name: nthrs_nesting.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + program icv + use omp_lib + call omp_set_nested(.true.) + call omp_set_dynamic(.false.) +!$omp parallel +!$omp parallel +!$omp single + ! If OMP_NUM_THREADS=2,3 was set, the following should print: + ! Inner: num_thds= 3 + ! Inner: num_thds= 3 + ! If nesting is not supported, the following should print: + ! Inner: num_thds= 1 + ! Inner: num_thds= 1 + print *, "Inner: num_thds=", omp_get_num_threads() +!$omp end single +!$omp end parallel +!$omp barrier + call omp_set_nested(.false.) +!$omp parallel +!$omp single + ! Even if OMP_NUM_THREADS=2,3 was set, the following should print, + ! because nesting is disabled: + ! Inner: num_thds= 1 + ! Inner: num_thds= 1 + print *, "Inner: num_thds=", omp_get_num_threads() +!$omp end single +!$omp end parallel +!$omp barrier +!$omp single + ! If OMP_NUM_THREADS=2,3 was set, the following should print: + ! Outer: num_thds= 2 + print *, "Outer: num_thds=", omp_get_num_threads() +!$omp end single +!$omp end parallel + end diff --git a/sources/Example_ordered.1c.c b/sources/Example_ordered.1c.c new file mode 100644 index 0000000..15b85c7 --- /dev/null +++ b/sources/Example_ordered.1c.c @@ -0,0 +1,29 @@ +/* +* @@name: ordered.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include + +void work(int k) +{ + #pragma omp ordered + printf(" %d\n", k); +} + +void ordered_example(int lb, int ub, int stride) +{ + int i; + + #pragma omp parallel for ordered schedule(dynamic) + for (i=lb; i 10) { + #pragma omp ordered + work(i+1); + } + } +} diff --git a/sources/Example_ordered.3f.f b/sources/Example_ordered.3f.f new file mode 100644 index 0000000..65429a8 --- /dev/null +++ b/sources/Example_ordered.3f.f @@ -0,0 +1,23 @@ +! @@name: ordered.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE ORDERED_GOOD(N) + INTEGER N + +!$OMP DO ORDERED + DO I = 1,N + IF (I <= 10) THEN +!$OMP ORDERED + CALL WORK(I) +!$OMP END ORDERED + ENDIF + + IF (I > 10) THEN +!$OMP ORDERED + CALL WORK(I+1) +!$OMP END ORDERED + ENDIF + ENDDO + END SUBROUTINE ORDERED_GOOD diff --git a/sources/Example_parallel.1c.c b/sources/Example_parallel.1c.c new file mode 100644 index 0000000..b9262a7 --- /dev/null +++ b/sources/Example_parallel.1c.c @@ -0,0 +1,41 @@ +/* +* @@name: parallel.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include + +void subdomain(float *x, int istart, int ipoints) +{ + int i; + + for (i = 0; i < ipoints; i++) + x[istart+i] = 123.456; +} + +void sub(float *x, int npoints) +{ + int iam, nt, ipoints, istart; + +#pragma omp parallel default(shared) private(iam,nt,ipoints,istart) + { + iam = omp_get_thread_num(); + nt = omp_get_num_threads(); + ipoints = npoints / nt; /* size of partition */ + istart = iam * ipoints; /* starting array index */ + if (iam == nt-1) /* last thread may do more */ + ipoints = npoints - istart; + subdomain(x, istart, ipoints); + } +} + +int main() +{ + float array[10000]; + + sub(array, 10000); + + return 0; +} diff --git a/sources/Example_parallel.1f.f b/sources/Example_parallel.1f.f new file mode 100644 index 0000000..44e156b --- /dev/null +++ b/sources/Example_parallel.1f.f @@ -0,0 +1,42 @@ +! @@name: parallel.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + SUBROUTINE SUBDOMAIN(X, ISTART, IPOINTS) + INTEGER ISTART, IPOINTS + REAL X(*) + + INTEGER I + + DO 100 I=1,IPOINTS + X(ISTART+I) = 123.456 + 100 CONTINUE + + END SUBROUTINE SUBDOMAIN + + SUBROUTINE SUB(X, NPOINTS) + INCLUDE "omp_lib.h" ! or USE OMP_LIB + + REAL X(*) + INTEGER NPOINTS + INTEGER IAM, NT, IPOINTS, ISTART + +!$OMP PARALLEL DEFAULT(PRIVATE) SHARED(X,NPOINTS) + + IAM = OMP_GET_THREAD_NUM() + NT = OMP_GET_NUM_THREADS() + IPOINTS = NPOINTS/NT + ISTART = IAM * IPOINTS + IF (IAM .EQ. NT-1) THEN + IPOINTS = NPOINTS - ISTART + ENDIF + CALL SUBDOMAIN(X,ISTART,IPOINTS) + +!$OMP END PARALLEL + END SUBROUTINE SUB + + PROGRAM PAREXAMPLE + REAL ARRAY(10000) + CALL SUB(ARRAY, 10000) + END PROGRAM PAREXAMPLE diff --git a/sources/Example_ploop.1c.c b/sources/Example_ploop.1c.c new file mode 100644 index 0000000..dde798f --- /dev/null +++ b/sources/Example_ploop.1c.c @@ -0,0 +1,15 @@ +/* +* @@name: ploop.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void simple(int n, float *a, float *b) +{ + int i; + +#pragma omp parallel for + for (i=1; i +void iterator_example() +{ + std::vector vec(23); + std::vector::iterator it; +#pragma omp parallel for default(none) shared(vec) + for (it = vec.begin(); it < vec.end(); it++) + { + // do work with *it // + } +} diff --git a/sources/Example_private.1c.c b/sources/Example_private.1c.c new file mode 100644 index 0000000..2b16f50 --- /dev/null +++ b/sources/Example_private.1c.c @@ -0,0 +1,32 @@ +/* +* @@name: private.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +#include + +int main() +{ + int i, j; + int *ptr_i, *ptr_j; + + i = 1; + j = 2; + + ptr_i = &i; + ptr_j = &j; + + #pragma omp parallel private(i) firstprivate(j) + { + i = 3; + j = j + 2; + assert (*ptr_i == 1 && *ptr_j == 2); + } + + assert(i == 1 && j == 2); + + return 0; +} diff --git a/sources/Example_private.1f.f b/sources/Example_private.1f.f new file mode 100644 index 0000000..fec044f --- /dev/null +++ b/sources/Example_private.1f.f @@ -0,0 +1,18 @@ +! @@name: private.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + PROGRAM PRIV_EXAMPLE + INTEGER I, J + + I = 1 + J = 2 + +!$OMP PARALLEL PRIVATE(I) FIRSTPRIVATE(J) + I = 3 + J = J + 2 +!$OMP END PARALLEL + + PRINT *, I, J ! I .eq. 1 .and. J .eq. 2 + END PROGRAM PRIV_EXAMPLE diff --git a/sources/Example_private.2c.c b/sources/Example_private.2c.c new file mode 100644 index 0000000..bdbce8a --- /dev/null +++ b/sources/Example_private.2c.c @@ -0,0 +1,25 @@ +/* +* @@name: private.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +int a; + +void g(int k) { + a = k; /* Accessed in the region but outside of the construct; + * therefore unspecified whether original or private list + * item is modified. */ +} + + +void f(int n) { + int a = 0; + + #pragma omp parallel for private(a) + for (int i=1; i +void priv_example3() +{ + int i, a; + + #pragma omp parallel private(a) + { + a = 1; + #pragma omp parallel for private(a) + for (i=0; i<10; i++) + { + a = 2; + } + assert(a == 1); + } +} diff --git a/sources/Example_private.3f.f b/sources/Example_private.3f.f new file mode 100644 index 0000000..080884a --- /dev/null +++ b/sources/Example_private.3f.f @@ -0,0 +1,18 @@ +! @@name: private.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE PRIV_EXAMPLE3() + INTEGER I, A + +!$OMP PARALLEL PRIVATE(A) + A = 1 +!$OMP PARALLEL DO PRIVATE(A) + DO I = 1, 10 + A = 2 + END DO +!$OMP END PARALLEL DO + PRINT *, A ! Outer A still has value 1 +!$OMP END PARALLEL + END SUBROUTINE PRIV_EXAMPLE3 diff --git a/sources/Example_psections.1c.c b/sources/Example_psections.1c.c new file mode 100644 index 0000000..7e1a351 --- /dev/null +++ b/sources/Example_psections.1c.c @@ -0,0 +1,25 @@ +/* +* @@name: psections.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void XAXIS(); +void YAXIS(); +void ZAXIS(); + +void sect_example() +{ + #pragma omp parallel sections + { + #pragma omp section + XAXIS(); + + #pragma omp section + YAXIS(); + + #pragma omp section + ZAXIS(); + } +} diff --git a/sources/Example_psections.1f.f b/sources/Example_psections.1f.f new file mode 100644 index 0000000..3b17366 --- /dev/null +++ b/sources/Example_psections.1f.f @@ -0,0 +1,17 @@ +! @@name: psections.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE SECT_EXAMPLE() +!$OMP PARALLEL SECTIONS +!$OMP SECTION + CALL XAXIS() +!$OMP SECTION + CALL YAXIS() + +!$OMP SECTION + CALL ZAXIS() + +!$OMP END PARALLEL SECTIONS + END SUBROUTINE SECT_EXAMPLE diff --git a/sources/Example_reduction.1c.c b/sources/Example_reduction.1c.c new file mode 100644 index 0000000..45fcf13 --- /dev/null +++ b/sources/Example_reduction.1c.c @@ -0,0 +1,26 @@ +/* +* @@name: reduction.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +void reduction1(float *x, int *y, int n) +{ + int i, b, c; + float a, d; + a = 0.0; + b = 0; + c = y[0]; + d = x[0]; + #pragma omp parallel for private(i) shared(x, y, n) \ + reduction(+:a) reduction(^:b) \ + reduction(min:c) reduction(max:d) + for (i=0; i y[i]) c = y[i]; + d = fmaxf(d,x[i]); + } +} diff --git a/sources/Example_reduction.1f.f b/sources/Example_reduction.1f.f new file mode 100644 index 0000000..4b58299 --- /dev/null +++ b/sources/Example_reduction.1f.f @@ -0,0 +1,23 @@ +! @@name: reduction.1f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +SUBROUTINE REDUCTION1(A, B, C, D, X, Y, N) + REAL :: X(*), A, D + INTEGER :: Y(*), N, B, C + INTEGER :: I + A = 0 + B = 0 + C = Y(1) + D = X(1) + !$OMP PARALLEL DO PRIVATE(I) SHARED(X, Y, N) REDUCTION(+:A) & + !$OMP& REDUCTION(IEOR:B) REDUCTION(MIN:C) REDUCTION(MAX:D) + DO I=1,N + A = A + X(I) + B = IEOR(B, Y(I)) + C = MIN(C, Y(I)) + IF (D < X(I)) D = X(I) + END DO + +END SUBROUTINE REDUCTION1 diff --git a/sources/Example_reduction.2c.c b/sources/Example_reduction.2c.c new file mode 100644 index 0000000..01ede12 --- /dev/null +++ b/sources/Example_reduction.2c.c @@ -0,0 +1,40 @@ +/* +* @@name: reduction.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include +void reduction2(float *x, int *y, int n) +{ + int i, b, b_p, c, c_p; + float a, a_p, d, d_p; + a = 0.0f; + b = 0; + c = y[0]; + d = x[0]; + #pragma omp parallel shared(a, b, c, d, x, y, n) \ + private(a_p, b_p, c_p, d_p) + { + a_p = 0.0f; + b_p = 0; + c_p = INT_MAX; + d_p = -HUGE_VALF; + #pragma omp for private(i) + for (i=0; i y[i]) c_p = y[i]; + d_p = fmaxf(d_p,x[i]); + } + #pragma omp critical + { + a += a_p; + b ^= b_p; + if( c > c_p ) c = c_p; + d = fmaxf(d,d_p); + } + } +} diff --git a/sources/Example_reduction.2f.f b/sources/Example_reduction.2f.f new file mode 100644 index 0000000..4e396b2 --- /dev/null +++ b/sources/Example_reduction.2f.f @@ -0,0 +1,35 @@ +! @@name: reduction.2f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE REDUCTION2(A, B, C, D, X, Y, N) + REAL :: X(*), A, D + INTEGER :: Y(*), N, B, C + REAL :: A_P, D_P + INTEGER :: I, B_P, C_P + A = 0 + B = 0 + C = Y(1) + D = X(1) + !$OMP PARALLEL SHARED(X, Y, A, B, C, D, N) & + !$OMP& PRIVATE(A_P, B_P, C_P, D_P) + A_P = 0.0 + B_P = 0 + C_P = HUGE(C_P) + D_P = -HUGE(D_P) + !$OMP DO PRIVATE(I) + DO I=1,N + A_P = A_P + X(I) + B_P = IEOR(B_P, Y(I)) + C_P = MIN(C_P, Y(I)) + IF (D_P < X(I)) D_P = X(I) + END DO + !$OMP CRITICAL + A = A + A_P + B = IEOR(B, B_P) + C = MIN(C, C_P) + D = MAX(D, D_P) + !$OMP END CRITICAL + !$OMP END PARALLEL + END SUBROUTINE REDUCTION2 diff --git a/sources/Example_reduction.3c.c b/sources/Example_reduction.3c.c new file mode 100644 index 0000000..4dd9dc6 --- /dev/null +++ b/sources/Example_reduction.3c.c @@ -0,0 +1,29 @@ +/* +* @@name: reduction.3c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: rt-error +*/ +#include + +int main (void) +{ + int a, i; + + #pragma omp parallel shared(a) private(i) + { + #pragma omp master + a = 0; + + // To avoid race conditions, add a barrier here. + + #pragma omp for reduction(+:a) + for (i = 0; i < 10; i++) { + a += i; + } + + #pragma omp single + printf ("Sum is %d\n", a); + } +} diff --git a/sources/Example_reduction.3f.f b/sources/Example_reduction.3f.f new file mode 100644 index 0000000..368b618 --- /dev/null +++ b/sources/Example_reduction.3f.f @@ -0,0 +1,20 @@ +! @@name: reduction.3f +! @@type: F-free +! @@compilable: no +! @@linkable: no +! @@expect: failure + PROGRAM REDUCTION_WRONG + MAX = HUGE(0) + M = 0 + + !$OMP PARALLEL DO REDUCTION(MAX: M) +! MAX is no longer the intrinsic so this is non-conforming + DO I = 1, 100 + CALL SUB(M,I) + END DO + + END PROGRAM REDUCTION_WRONG + + SUBROUTINE SUB(M,I) + M = MAX(M,I) + END SUBROUTINE SUB diff --git a/sources/Example_reduction.4f.f b/sources/Example_reduction.4f.f new file mode 100644 index 0000000..9fb784e --- /dev/null +++ b/sources/Example_reduction.4f.f @@ -0,0 +1,17 @@ +! @@name: reduction.4f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +MODULE M + INTRINSIC MAX +END MODULE M + +PROGRAM REDUCTION3 + USE M, REN => MAX + N = 0 +!$OMP PARALLEL DO REDUCTION(REN: N) ! still does MAX + DO I = 1, 100 + N = MAX(N,I) + END DO +END PROGRAM REDUCTION3 diff --git a/sources/Example_reduction.5f.f b/sources/Example_reduction.5f.f new file mode 100644 index 0000000..a1477cf --- /dev/null +++ b/sources/Example_reduction.5f.f @@ -0,0 +1,20 @@ +! @@name: reduction.5f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +MODULE MOD + INTRINSIC MAX, MIN +END MODULE MOD + +PROGRAM REDUCTION4 + USE MOD, MIN=>MAX, MAX=>MIN + REAL :: R + R = -HUGE(0.0) + +!$OMP PARALLEL DO REDUCTION(MIN: R) ! still does MAX + DO I = 1, 1000 + R = MIN(R, SIN(REAL(I))) + END DO + PRINT *, R +END PROGRAM REDUCTION4 diff --git a/sources/Example_reduction.6f.f b/sources/Example_reduction.6f.f new file mode 100644 index 0000000..eed2bab --- /dev/null +++ b/sources/Example_reduction.6f.f @@ -0,0 +1,26 @@ +! @@name: reduction.6f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: rt-error + INTEGER A, I + +!$OMP PARALLEL SHARED(A) PRIVATE(I) + +!$OMP MASTER + A = 0 +!$OMP END MASTER + + ! To avoid race conditions, add a barrier here. + +!$OMP DO REDUCTION(+:A) + DO I= 0, 9 + A = A + I + END DO + +!$OMP SINGLE + PRINT *, "Sum is ", A +!$OMP END SINGLE + +!$OMP END PARALLEL + END diff --git a/sources/Example_set_dynamic_nthrs.1c.c b/sources/Example_set_dynamic_nthrs.1c.c new file mode 100644 index 0000000..a22a750 --- /dev/null +++ b/sources/Example_set_dynamic_nthrs.1c.c @@ -0,0 +1,29 @@ +/* +* @@name: set_dynamic_nthrs.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include + +void do_by_16(float *x, int iam, int ipoints) {} + +void dynthreads(float *x, int npoints) +{ + int iam, ipoints; + + omp_set_dynamic(0); + omp_set_num_threads(16); + + #pragma omp parallel shared(x, npoints) private(iam, ipoints) + { + if (omp_get_num_threads() != 16) + abort(); + + iam = omp_get_thread_num(); + ipoints = npoints/16; + do_by_16(x, iam, ipoints); + } +} diff --git a/sources/Example_set_dynamic_nthrs.1f.f b/sources/Example_set_dynamic_nthrs.1f.f new file mode 100644 index 0000000..7fd3c0a --- /dev/null +++ b/sources/Example_set_dynamic_nthrs.1f.f @@ -0,0 +1,35 @@ +! @@name: set_dynamic_nthrs.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE DO_BY_16(X, IAM, IPOINTS) + REAL X(*) + INTEGER IAM, IPOINTS + END SUBROUTINE DO_BY_16 + + SUBROUTINE DYNTHREADS(X, NPOINTS) + + INCLUDE "omp_lib.h" ! or USE OMP_LIB + + INTEGER NPOINTS + REAL X(NPOINTS) + + INTEGER IAM, IPOINTS + + CALL OMP_SET_DYNAMIC(.FALSE.) + CALL OMP_SET_NUM_THREADS(16) + +!$OMP PARALLEL SHARED(X,NPOINTS) PRIVATE(IAM, IPOINTS) + + IF (OMP_GET_NUM_THREADS() .NE. 16) THEN + STOP + ENDIF + + IAM = OMP_GET_THREAD_NUM() + IPOINTS = NPOINTS/16 + CALL DO_BY_16(X,IAM,IPOINTS) + +!$OMP END PARALLEL + + END SUBROUTINE DYNTHREADS diff --git a/sources/Example_simple_lock.1c.c b/sources/Example_simple_lock.1c.c new file mode 100644 index 0000000..104ed63 --- /dev/null +++ b/sources/Example_simple_lock.1c.c @@ -0,0 +1,40 @@ +/* +* @@name: simple_lock.1c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +#include +void skip(int i) {} +void work(int i) {} +int main() +{ + omp_lock_t lck; + int id; + omp_init_lock(&lck); + + #pragma omp parallel shared(lck) private(id) + { + id = omp_get_thread_num(); + + omp_set_lock(&lck); + /* only one thread at a time can execute this printf */ + printf("My thread id is %d.\n", id); + omp_unset_lock(&lck); + + while (! omp_test_lock(&lck)) { + skip(id); /* we do not yet have the lock, + so we must do something else */ + } + + work(id); /* we now have the lock + and can do the work */ + + omp_unset_lock(&lck); + } + omp_destroy_lock(&lck); + + return 0; +} diff --git a/sources/Example_simple_lock.1f.f b/sources/Example_simple_lock.1f.f new file mode 100644 index 0000000..e6e9b82 --- /dev/null +++ b/sources/Example_simple_lock.1f.f @@ -0,0 +1,41 @@ +! @@name: simple_lock.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + SUBROUTINE SKIP(ID) + END SUBROUTINE SKIP + + SUBROUTINE WORK(ID) + END SUBROUTINE WORK + + PROGRAM SIMPLELOCK + + INCLUDE "omp_lib.h" ! or USE OMP_LIB + + INTEGER(OMP_LOCK_KIND) LCK + INTEGER ID + + CALL OMP_INIT_LOCK(LCK) + +!$OMP PARALLEL SHARED(LCK) PRIVATE(ID) + ID = OMP_GET_THREAD_NUM() + CALL OMP_SET_LOCK(LCK) + PRINT *, 'My thread id is ', ID + CALL OMP_UNSET_LOCK(LCK) + + DO WHILE (.NOT. OMP_TEST_LOCK(LCK)) + CALL SKIP(ID) ! We do not yet have the lock + ! so we must do something else + END DO + + CALL WORK(ID) ! We now have the lock + ! and can do the work + + CALL OMP_UNSET_LOCK( LCK ) + +!$OMP END PARALLEL + + CALL OMP_DESTROY_LOCK( LCK ) + + END PROGRAM SIMPLELOCK diff --git a/sources/Example_single.1c.c b/sources/Example_single.1c.c new file mode 100644 index 0000000..2169314 --- /dev/null +++ b/sources/Example_single.1c.c @@ -0,0 +1,30 @@ +/* +* @@name: single.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include + +void work1() {} +void work2() {} + +void single_example() +{ + #pragma omp parallel + { + #pragma omp single + printf("Beginning work1.\n"); + + work1(); + + #pragma omp single + printf("Finishing work1.\n"); + + #pragma omp single nowait + printf("Finished work1 and beginning work2.\n"); + + work2(); + } +} diff --git a/sources/Example_single.1f.f b/sources/Example_single.1f.f new file mode 100644 index 0000000..4ce6d85 --- /dev/null +++ b/sources/Example_single.1f.f @@ -0,0 +1,33 @@ +! @@name: single.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + SUBROUTINE WORK1() + END SUBROUTINE WORK1 + + SUBROUTINE WORK2() + END SUBROUTINE WORK2 + + PROGRAM SINGLE_EXAMPLE +!$OMP PARALLEL + +!$OMP SINGLE + print *, "Beginning work1." +!$OMP END SINGLE + + CALL WORK1() + +!$OMP SINGLE + print *, "Finishing work1." +!$OMP END SINGLE + +!$OMP SINGLE + print *, "Finished work1 and beginning work2." +!$OMP END SINGLE NOWAIT + + CALL WORK2() + +!$OMP END PARALLEL + + END PROGRAM SINGLE_EXAMPLE diff --git a/sources/Example_standalone.1c.c b/sources/Example_standalone.1c.c new file mode 100644 index 0000000..1562fe7 --- /dev/null +++ b/sources/Example_standalone.1c.c @@ -0,0 +1,33 @@ +/* +* @@name: standalone.1c +* @@type: C +* @@compilable: no +* @@linkable: no +* @@expect: failure +*/ + +void standalone_wrong() +{ + int a = 1; + + if (a != 0) + #pragma omp flush(a) +/* incorrect as flush cannot be immediate substatement + of if statement */ + + if (a != 0) + #pragma omp barrier +/* incorrect as barrier cannot be immediate substatement + of if statement */ + + if (a!=0) + #pragma omp taskyield +/* incorrect as taskyield cannot be immediate substatement of if statement +*/ + + if (a != 0) + #pragma omp taskwait +/* incorrect as taskwait cannot be immediate substatement + of if statement */ + +} diff --git a/sources/Example_standalone.1f.f b/sources/Example_standalone.1f.f new file mode 100644 index 0000000..de8c3bb --- /dev/null +++ b/sources/Example_standalone.1f.f @@ -0,0 +1,46 @@ +! @@name: standalone.1f +! @@type: F-free +! @@compilable: no +! @@linkable: no +! @@expect: failure +SUBROUTINE STANDALONE_WRONG() + INTEGER A + A = 1 + ! the FLUSH directive must not be the action statement + ! in an IF statement + IF (A .NE. 0) !$OMP FLUSH(A) + + ! the BARRIER directive must not be the action statement + ! in an IF statement + IF (A .NE. 0) !$OMP BARRIER + + ! the TASKWAIT directive must not be the action statement + ! in an IF statement + IF (A .NE. 0) !$OMP TASKWAIT + + ! the TASKYIELD directive must not be the action statement + ! in an IF statement + IF (A .NE. 0) !$OMP TASKYIELD + + GOTO 100 + + ! the FLUSH directive must not be a labeled branch target + ! statement + 100 !$OMP FLUSH(A) + GOTO 200 + + ! the BARRIER directive must not be a labeled branch target + ! statement + 200 !$OMP BARRIER + GOTO 300 + + ! the TASKWAIT directive must not be a labeled branch target + ! statement + 300 !$OMP TASKWAIT + GOTO 400 + + ! the TASKYIELD directive must not be a labeled branch target + ! statement + 400 !$OMP TASKYIELD + +END SUBROUTINE diff --git a/sources/Example_standalone.2c.c b/sources/Example_standalone.2c.c new file mode 100644 index 0000000..cc14535 --- /dev/null +++ b/sources/Example_standalone.2c.c @@ -0,0 +1,27 @@ +/* +* @@name: standalone.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void standalone_ok() +{ + int a = 1; + + #pragma omp parallel + { + if (a != 0) { + #pragma omp flush(a) + } + if (a != 0) { + #pragma omp barrier + } + if (a != 0) { + #pragma omp taskwait + } + if (a != 0) { + #pragma omp taskyield + } + } +} diff --git a/sources/Example_standalone.2f.f b/sources/Example_standalone.2f.f new file mode 100644 index 0000000..5e2347a --- /dev/null +++ b/sources/Example_standalone.2f.f @@ -0,0 +1,33 @@ +! @@name: standalone.2f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +SUBROUTINE STANDALONE_OK() + INTEGER A + A = 1 + IF (A .NE. 0) THEN + !$OMP FLUSH(A) + ENDIF + IF (A .NE. 0) THEN + !$OMP BARRIER + ENDIF + IF (A .NE. 0) THEN + !$OMP TASKWAIT + ENDIF + IF (A .NE. 0) THEN + !$OMP TASKYIELD + ENDIF + GOTO 100 + 100 CONTINUE + !$OMP FLUSH(A) + GOTO 200 + 200 CONTINUE + !$OMP BARRIER + GOTO 300 + 300 CONTINUE + !$OMP TASKWAIT + GOTO 400 + 400 CONTINUE + !$OMP TASKYIELD +END SUBROUTINE diff --git a/sources/Example_target.1c.c b/sources/Example_target.1c.c new file mode 100644 index 0000000..d9d0820 --- /dev/null +++ b/sources/Example_target.1c.c @@ -0,0 +1,20 @@ +/* +* @@name: target.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +extern void init(float*, float*, int); +extern void output(float*, int); +void vec_mult(int N) +{ + int i; + float p[N], v1[N], v2[N]; + init(v1, v2, N); + #pragma omp target + #pragma omp parallel for private(i) + for (i=0; iTHRESHOLD1) map(to: v1[0:N], v2[:N])\ + map(from: p[0:N]) + #pragma omp parallel for if(N>THRESHOLD2) + for (i=0; iTHRESHHOLD1) map(to: v1, v2 ) map(from: p) + !$omp parallel do if(N>THRESHOLD2) + do i=1,N + p(i) = v1(i) * v2(i) + end do + !$omp end target + call output(p, N) +end subroutine diff --git a/sources/Example_target_data.1c.c b/sources/Example_target_data.1c.c new file mode 100644 index 0000000..9bfea76 --- /dev/null +++ b/sources/Example_target_data.1c.c @@ -0,0 +1,22 @@ +/* +* @@name: target_data.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +extern void init(float*, float*, int); +extern void output(float*, int); +void vec_mult(float *p, float *v1, float *v2, int N) +{ + int i; + init(v1, v2, N); + #pragma omp target data map(to: v1[0:N], v2[:N]) map(from: p[0:N]) + { + #pragma omp target + #pragma omp parallel for + for (i=0; i +void gramSchmidt(restrict float Q[][COLS], const int rows, const int cols) +{ + #pragma omp target data map(Q[0:rows][0:cols]) + for(int k=0; k < cols; k++) + { + double tmp = 0.0; + #pragma omp target + #pragma omp parallel for reduction(+:tmp) + for(int i=0; i < rows; i++) + tmp += (Q[i][k] * Q[i][k]); + tmp = 1/sqrt(tmp); + #pragma omp target + #pragma omp parallel for + for(int i=0; i < rows; i++) + Q[i][k] *= tmp; + } +} diff --git a/sources/Example_target_data.3f.f b/sources/Example_target_data.3f.f new file mode 100644 index 0000000..d1cea10 --- /dev/null +++ b/sources/Example_target_data.3f.f @@ -0,0 +1,27 @@ +! @@name: target_data.3f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine gramSchmidt(Q,rows,cols) +integer :: rows,cols, i,k +double precision :: Q(rows,cols), tmp + !$omp target data map(Q) + do k=1,cols + tmp = 0.0d0 + !$omp target + !$omp parallel do reduction(+:tmp) + do i=1,rows + tmp = tmp + (Q(i,k) * Q(i,k)) + end do + !$omp end target + tmp = 1.0d0/sqrt(tmp) + !$omp target + !$omp parallel do + do i=1,rows + Q(i,k) = Q(i,k)*tmp + enddo + !$omp end target + end do + !$omp end target data +end subroutine diff --git a/sources/Example_target_data.4c.c b/sources/Example_target_data.4c.c new file mode 100644 index 0000000..e2de896 --- /dev/null +++ b/sources/Example_target_data.4c.c @@ -0,0 +1,26 @@ +/* +* @@name: target_data.4c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void vec_mult(float*, float*, float*, int); +extern void init(float*, float*, int); +extern void output(float*, int); +void foo(float *p0, float *v1, float *v2, int N) +{ + init(v1, v2, N); + #pragma omp target data map(to: v1[0:N], v2[:N]) map(from: p0[0:N]) + { + vec_mult(p0, v1, v2, N); + } + output(p0, N); +} +void vec_mult(float *p1, float *v3, float *v4, int N) +{ + #pragma omp target map(to: v3[0:N], v4[:N]) map(from: p1[0:N]) + #pragma omp parallel for + for (i=0; iTHRESHOLD) map(from: p[0:N]) + { + #pragma omp target if (N>THRESHOLD) map(to: v1[:N], v2[:N]) + #pragma omp parallel for + for (i=0; iTHRESHOLD) map(to: v1[:N], v2[:N]) + #pragma omp parallel for + for (i=0; iTHRESHOLD) map(from: p) + !$omp target if(N>THRESHOLD) map(to: v1, v2) + !$omp parallel do + do i=1,N + p(i) = v1(i) * v2(i) + end do + !$omp end target + call init_again(v1, v2, N) + !$omp target if(N>THRESHOLD) map(to: v1, v2) + !$omp parallel do + do i=1,N + p(i) = p(i) + v1(i) * v2(i) + end do + !$omp end target + !$omp end target data + call output(p, N) +end subroutine diff --git a/sources/Example_target_data.7c.c b/sources/Example_target_data.7c.c new file mode 100644 index 0000000..138956c --- /dev/null +++ b/sources/Example_target_data.7c.c @@ -0,0 +1,23 @@ +/* +* @@name: target_data.7c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#define THRESHOLD 1000000 +extern void init(float*, float*, int); +extern void output(float*, int); +void vec_mult(float *p, float *v1, float *v2, int N) +{ + int i; + init(v1, v2, N); + #pragma omp target data map(from: p[0:N]) + { + #pragma omp target if (N>THRESHOLD) map(to: v1[:N], v2[:N]) + #pragma omp parallel for + for (i=0; iTHRESHOLD) map(to: v1, v2) + !$omp parallel do + do i=1,N + p(i) = v1(i) * v2(i) + end do + !$omp end target + !$omp end target data + call output(p, N) !*** UNDEFINED behavior if N<=THRESHOLD +end subroutine diff --git a/sources/Example_target_update.1c.c b/sources/Example_target_update.1c.c new file mode 100644 index 0000000..f506b39 --- /dev/null +++ b/sources/Example_target_update.1c.c @@ -0,0 +1,29 @@ +/* +* @@name: target_update.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +extern void init(float *, float *, int); +extern void init_again(float *, float *, int); +extern void output(float *, int); +void vec_mult(float *p, float *v1, float *v2, int N) +{ + int i; + init(v1, v2, N); + #pragma omp target data map(to: v1[:N], v2[:N]) map(from: p[0:N]) + { + #pragma omp target + #pragma omp parallel for + for (i=0; ileft) + { + #pragma omp task + compute_tree(tree->left); + } + if (tree->right) + { + #pragma omp task + compute_tree(tree->right); + } + #pragma omp task + compute_something(tree); +} +int main() +{ + int i; + tree_type tree; + init_tree(tree); + #pragma omp parallel + #pragma omp single + { + #pragma omp task + start_background_work(); + for (i = 0; i < max_steps; i++) + { + #pragma omp taskgroup + { + #pragma omp task + compute_tree(tree); + } // wait on tree traversal in this step + check_step(); + } + } // only now is background work required to be complete + print_results(); +} diff --git a/sources/Example_taskgroup.1f.f b/sources/Example_taskgroup.1f.f new file mode 100644 index 0000000..fa93b77 --- /dev/null +++ b/sources/Example_taskgroup.1f.f @@ -0,0 +1,53 @@ +! @@name: taskgroup.1f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +module tree_type_mod + integer, parameter :: max_steps=100 + type tree_type + type(tree_type), pointer :: left, right + end type + contains + subroutine compute_something(tree) + type(tree_type), pointer :: tree +! some computation + end subroutine + recursive subroutine compute_tree(tree) + type(tree_type), pointer :: tree + if (associated(tree%left)) then +!$omp task + call compute_tree(tree%left) +!$omp end task + endif + if (associated(tree%right)) then +!$omp task + call compute_tree(tree%right) +!$omp end task + endif +!$omp task + call compute_something(tree) +!$omp end task + end subroutine +end module +program main + use tree_type_mod + type(tree_type), pointer :: tree + call init_tree(tree); +!$omp parallel +!$omp single +!$omp task + call start_background_work() +!$omp end task + do i=1, max_steps +!$omp taskgroup +!$omp task + call compute_tree(tree) +!$omp end task +!$omp end taskgroup ! wait on tree traversal in this step + call check_step() + enddo +!$omp end single +!$omp end parallel ! only now is background work required to be complete + call print_results() +end program diff --git a/sources/Example_tasking.10c.c b/sources/Example_tasking.10c.c new file mode 100644 index 0000000..9b1a929 --- /dev/null +++ b/sources/Example_tasking.10c.c @@ -0,0 +1,30 @@ +/* +* @@name: tasking.10c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +void work() { + omp_lock_t lock; + omp_init_lock(&lock); +#pragma omp parallel + { + int i; +#pragma omp for + for (i = 0; i < 100; i++) { +#pragma omp task + { + // lock is shared by default in the task + omp_set_lock(&lock); + // Capture data for the following task +#pragma omp task + // Task Scheduling Point 1 + { /* do work here */ } + omp_unset_lock(&lock); + } + } + } + omp_destroy_lock(&lock); +} diff --git a/sources/Example_tasking.10f.f b/sources/Example_tasking.10f.f new file mode 100644 index 0000000..72f01ce --- /dev/null +++ b/sources/Example_tasking.10f.f @@ -0,0 +1,30 @@ +! @@name: tasking.10f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + module example + include 'omp_lib.h' + integer (kind=omp_lock_kind) lock + integer i + contains + subroutine work + call omp_init_lock(lock) +!$omp parallel + !$omp do + do i=1,100 + !$omp task + ! Outer task + call omp_set_lock(lock) ! lock is shared by + ! default in the task + ! Capture data for the following task + !$omp task ! Task Scheduling Point 1 + ! do work here + !$omp end task + call omp_unset_lock(lock) + !$omp end task + end do +!$omp end parallel + call omp_destroy_lock(lock) + end subroutine + end module diff --git a/sources/Example_tasking.11c.c b/sources/Example_tasking.11c.c new file mode 100644 index 0000000..f711073 --- /dev/null +++ b/sources/Example_tasking.11c.c @@ -0,0 +1,18 @@ +/* +* @@name: tasking.11c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +void foo ( ) +{ + int x = 2; + #pragma omp task shared(x) mergeable + { + x++; + } + #pragma omp taskwait + printf("%d\n",x); // prints 3 +} diff --git a/sources/Example_tasking.11f.f b/sources/Example_tasking.11f.f new file mode 100644 index 0000000..3db2c63 --- /dev/null +++ b/sources/Example_tasking.11f.f @@ -0,0 +1,14 @@ +! @@name: tasking.11f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine foo() + integer :: x + x = 2 +!$omp task shared(x) mergeable + x = x + 1 +!$omp end task +!$omp taskwait + print *, x ! prints 3 +end subroutine diff --git a/sources/Example_tasking.12c.c b/sources/Example_tasking.12c.c new file mode 100644 index 0000000..44d9e69 --- /dev/null +++ b/sources/Example_tasking.12c.c @@ -0,0 +1,18 @@ +/* +* @@name: tasking.12c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: rt-error +*/ +#include +void foo ( ) +{ + int x = 2; + #pragma omp task mergeable + { + x++; + } + #pragma omp taskwait + printf("%d\n",x); // prints 2 or 3 +} diff --git a/sources/Example_tasking.12f.f b/sources/Example_tasking.12f.f new file mode 100644 index 0000000..955b116 --- /dev/null +++ b/sources/Example_tasking.12f.f @@ -0,0 +1,14 @@ +! @@name: tasking.12f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: rt-error +subroutine foo() + integer :: x + x = 2 +!$omp task mergeable + x = x + 1 +!$omp end task +!$omp taskwait + print *, x ! prints 2 or 3 +end subroutine diff --git a/sources/Example_tasking.13c.c b/sources/Example_tasking.13c.c new file mode 100644 index 0000000..27f6f6d --- /dev/null +++ b/sources/Example_tasking.13c.c @@ -0,0 +1,39 @@ +/* +* @@name: tasking.13c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include +#define LIMIT 3 /* arbitrary limit on recursion depth */ +void check_solution(char *); +void bin_search (int pos, int n, char *state) +{ + if ( pos == n ) { + check_solution(state); + return; + } + #pragma omp task final( pos > LIMIT ) mergeable + { + char new_state[n]; + if (!omp_in_final() ) { + memcpy(new_state, state, pos ); + state = new_state; + } + state[pos] = 0; + bin_search(pos+1, n, state ); + } + #pragma omp task final( pos > LIMIT ) mergeable + { + char new_state[n]; + if (! omp_in_final() ) { + memcpy(new_state, state, pos ); + state = new_state; + } + state[pos] = 1; + bin_search(pos+1, n, state ); + } + #pragma omp taskwait +} diff --git a/sources/Example_tasking.13f.f b/sources/Example_tasking.13f.f new file mode 100644 index 0000000..d9426b2 --- /dev/null +++ b/sources/Example_tasking.13f.f @@ -0,0 +1,33 @@ +! @@name: tasking.13f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +recursive subroutine bin_search(pos, n, state) + use omp_lib + integer :: pos, n + character, pointer :: state(:) + character, target, dimension(n) :: new_state1, new_state2 + integer, parameter :: LIMIT = 3 + if (pos .eq. n) then + call check_solution(state) + return + endif +!$omp task final(pos > LIMIT) mergeable + if (.not. omp_in_final()) then + new_state1(1:pos) = state(1:pos) + state => new_state1 + endif + state(pos+1) = 'z' + call bin_search(pos+1, n, state) +!$omp end task +!$omp task final(pos > LIMIT) mergeable + if (.not. omp_in_final()) then + new_state2(1:pos) = state(1:pos) + state => new_state2 + endif + state(pos+1) = 'y' + call bin_search(pos+1, n, state) +!$omp end task +!$omp taskwait +end subroutine diff --git a/sources/Example_tasking.14c.c b/sources/Example_tasking.14c.c new file mode 100644 index 0000000..381a13f --- /dev/null +++ b/sources/Example_tasking.14c.c @@ -0,0 +1,27 @@ +/* +* @@name: tasking.14c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void foo ( ) +{ + int i; + #pragma omp task if(0) // This task is undeferred + { + #pragma omp task // This task is a regular task + for (i = 0; i < 3; i++) { + #pragma omp task // This task is a regular task + bar(); + } + } + #pragma omp task final(1) // This task is a regular task + { + #pragma omp task // This task is included + for (i = 0; i < 3; i++) { + #pragma omp task // This task is also included + bar(); + } + } +} diff --git a/sources/Example_tasking.14f.f b/sources/Example_tasking.14f.f new file mode 100644 index 0000000..8cfee6f --- /dev/null +++ b/sources/Example_tasking.14f.f @@ -0,0 +1,26 @@ +! @@name: tasking.14f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine foo() +integer i +!$omp task if(.FALSE.) ! This task is undeferred +!$omp task ! This task is a regular task + do i = 1, 3 + !$omp task ! This task is a regular task + call bar() + !$omp end task + enddo +!$omp end task +!$omp end task +!$omp task final(.TRUE.) ! This task is a regular task +!$omp task ! This task is included + do i = 1, 3 + !$omp task ! This task is also included + call bar() + !$omp end task + enddo +!$omp end task +!$omp end task +end subroutine diff --git a/sources/Example_tasking.15c.c b/sources/Example_tasking.15c.c new file mode 100644 index 0000000..0191c91 --- /dev/null +++ b/sources/Example_tasking.15c.c @@ -0,0 +1,21 @@ +/* +* @@name: tasking.15c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +int main() +{ + int x = 1; + #pragma omp parallel + #pragma omp single + { + #pragma omp task shared(x) depend(out: x) + x = 2; + #pragma omp task shared(x) depend(in: x) + printf("x = %d\n", x); + } + return 0; +} diff --git a/sources/Example_tasking.15f.f b/sources/Example_tasking.15f.f new file mode 100644 index 0000000..4fed17c --- /dev/null +++ b/sources/Example_tasking.15f.f @@ -0,0 +1,19 @@ +! @@name: tasking.15f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +program example + integer :: x + x = 1 + !$omp parallel + !$omp single + !$omp task shared(x) depend(out: x) + x = 2 + !$omp end task + !$omp task shared(x) depend(in: x) + print*, "x = ", x + !$omp end task + !$omp end single + !$omp end parallel +end program diff --git a/sources/Example_tasking.16c.c b/sources/Example_tasking.16c.c new file mode 100644 index 0000000..32b8443 --- /dev/null +++ b/sources/Example_tasking.16c.c @@ -0,0 +1,21 @@ +/* +* @@name: tasking.16c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +int main() +{ + int x = 1; + #pragma omp parallel + #pragma omp single + { + #pragma omp task shared(x) depend(in: x) + printf("x = %d\n", x); + #pragma omp task shared(x) depend(out: x) + x = 2; + } + return 0; +} diff --git a/sources/Example_tasking.16f.f b/sources/Example_tasking.16f.f new file mode 100644 index 0000000..01f41b0 --- /dev/null +++ b/sources/Example_tasking.16f.f @@ -0,0 +1,19 @@ +! @@name: tasking.16f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +program example + integer :: x + x = 1 + !$omp parallel + !$omp single + !$omp task shared(x) depend(in: x) + print*, "x = ", x + !$omp end task + !$omp task shared(x) depend(out: x) + x = 2 + !$omp end task + !$omp end single + !$omp end parallel +end program diff --git a/sources/Example_tasking.17c.c b/sources/Example_tasking.17c.c new file mode 100644 index 0000000..1df0ac2 --- /dev/null +++ b/sources/Example_tasking.17c.c @@ -0,0 +1,23 @@ +/* +* @@name: tasking.17c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +int main() +{ + int x; + #pragma omp parallel + #pragma omp single + { + #pragma omp task shared(x) depend(out: x) + x = 1; + #pragma omp task shared(x) depend(out: x) + x = 2; + #pragma omp taskwait + printf("x = %d\n", x); + } + return 0; +} diff --git a/sources/Example_tasking.17f.f b/sources/Example_tasking.17f.f new file mode 100644 index 0000000..e82cb57 --- /dev/null +++ b/sources/Example_tasking.17f.f @@ -0,0 +1,20 @@ +! @@name: tasking.17f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +program example + integer :: x + !$omp parallel + !$omp single + !$omp task shared(x) depend(out: x) + x = 1 + !$omp end task + !$omp task shared(x) depend(out: x) + x = 2 + !$omp end task + !$omp taskwait + print*, "x = ", x + !$omp end single + !$omp end parallel +end program diff --git a/sources/Example_tasking.18c.c b/sources/Example_tasking.18c.c new file mode 100644 index 0000000..a1eb0a1 --- /dev/null +++ b/sources/Example_tasking.18c.c @@ -0,0 +1,23 @@ +/* +* @@name: tasking.18c +* @@type: C +* @@compilable: yes +* @@linkable: yes +* @@expect: success +*/ +#include +int main() +{ + int x = 1; + #pragma omp parallel + #pragma omp single + { + #pragma omp task shared(x) depend(out: x) + x = 2; + #pragma omp task shared(x) depend(in: x) + printf("x + 1 = %d. ", x+1); + #pragma omp task shared(x) depend(in: x) + printf("x + 2 = %d\n", x+2); + } + return 0; +} diff --git a/sources/Example_tasking.18f.f b/sources/Example_tasking.18f.f new file mode 100644 index 0000000..42ee105 --- /dev/null +++ b/sources/Example_tasking.18f.f @@ -0,0 +1,22 @@ +! @@name: tasking.18f +! @@type: F-free +! @@compilable: yes +! @@linkable: yes +! @@expect: success +program example + integer :: x + x = 1 + !$omp parallel + !$omp single + !$omp task shared(x) depend(out: x) + x = 2 + !$omp end task + !$omp task shared(x) depend(in: x) + print*, "x + 1 = ", x+1, "." + !$omp end task + !$omp task shared(x) depend(in: x) + print*, "x + 2 = ", x+2, "." + !$omp end task + !$omp end single + !$omp end parallel +end program diff --git a/sources/Example_tasking.19c.c b/sources/Example_tasking.19c.c new file mode 100644 index 0000000..f7cfbe8 --- /dev/null +++ b/sources/Example_tasking.19c.c @@ -0,0 +1,25 @@ +/* +* @@name: tasking.19c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +// Assume BS divides N perfectly +void matmul_depend(int N, int BS, float A[N][N], float B[N][N], float +C[N][N] ) +{ + int i, j, k, ii, jj, kk; + for (i = 0; i < N; i+=BS) { + for (j = 0; j < N; j+=BS) { + for (k = 0; k < N; k+=BS) { +#pragma omp task depend ( in: A[i:BS][k:BS], B[k:BS][j:BS] ) \ + depend ( inout: C[i:BS][j:BS] ) + for (ii = i; ii < i+BS; ii++ ) + for (jj = j; jj < j+BS; jj++ ) + for (kk = k; kk < k+BS; kk++ ) + C[ii][jj] = C[ii][jj] + A[ii][kk] * B[kk][jj]; + } + } + } +} diff --git a/sources/Example_tasking.19f.f b/sources/Example_tasking.19f.f new file mode 100644 index 0000000..44dc306 --- /dev/null +++ b/sources/Example_tasking.19f.f @@ -0,0 +1,27 @@ +! @@name: tasking.19f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine matmul_depend (N, BS, A, B, C) + integer :: N, BS, BM + real, dimension(N, N) :: A, B, C + integer :: i, j, k, ii, jj, kk + BM = BS -1 + do i = 1, N, BS + do j = 1, N, BS + do k = 1, N, BS +!$omp task depend ( in: A(i:i+BM, k:k+BM), B(k:k+BM, j:j+BM) ) & +!$omp depend ( inout: C(i:i+BM, j:j+BM) ) + do ii = i, i+BS + do jj = j, j+BS + do kk = k, k+BS + C(jj,ii) = C(jj,ii) + A(kk,ii) * B(jj,kk) + end do + end do + end do +!$omp end task + end do + end do + end do +end subroutine diff --git a/sources/Example_tasking.1c.c b/sources/Example_tasking.1c.c new file mode 100644 index 0000000..b8b855c --- /dev/null +++ b/sources/Example_tasking.1c.c @@ -0,0 +1,21 @@ +/* +* @@name: tasking.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +struct node { + struct node *left; + struct node *right; +}; +extern void process(struct node *); +void traverse( struct node *p ) { + if (p->left) +#pragma omp task // p is firstprivate by default + traverse(p->left); + if (p->right) +#pragma omp task // p is firstprivate by default + traverse(p->right); + process(p); +} diff --git a/sources/Example_tasking.1f.f b/sources/Example_tasking.1f.f new file mode 100644 index 0000000..c1ee1b2 --- /dev/null +++ b/sources/Example_tasking.1f.f @@ -0,0 +1,22 @@ +! @@name: tasking.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + RECURSIVE SUBROUTINE traverse ( P ) + TYPE Node + TYPE(Node), POINTER :: left, right + END TYPE Node + TYPE(Node) :: P + IF (associated(P%left)) THEN + !$OMP TASK ! P is firstprivate by default + call traverse(P%left) + !$OMP END TASK + ENDIF + IF (associated(P%right)) THEN + !$OMP TASK ! P is firstprivate by default + call traverse(P%right) + !$OMP END TASK + ENDIF + CALL process ( P ) + END SUBROUTINE diff --git a/sources/Example_tasking.2c.c b/sources/Example_tasking.2c.c new file mode 100644 index 0000000..e543ada --- /dev/null +++ b/sources/Example_tasking.2c.c @@ -0,0 +1,22 @@ +/* +* @@name: tasking.2c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +struct node { + struct node *left; + struct node *right; +}; +extern void process(struct node *); +void postorder_traverse( struct node *p ) { + if (p->left) + #pragma omp task // p is firstprivate by default + postorder_traverse(p->left); + if (p->right) + #pragma omp task // p is firstprivate by default + postorder_traverse(p->right); + #pragma omp taskwait + process(p); +} diff --git a/sources/Example_tasking.2f.f b/sources/Example_tasking.2f.f new file mode 100644 index 0000000..b5e2a5c --- /dev/null +++ b/sources/Example_tasking.2f.f @@ -0,0 +1,23 @@ +! @@name: tasking.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + RECURSIVE SUBROUTINE traverse ( P ) + TYPE Node + TYPE(Node), POINTER :: left, right + END TYPE Node + TYPE(Node) :: P + IF (associated(P%left)) THEN + !$OMP TASK ! P is firstprivate by default + call traverse(P%left) + !$OMP END TASK + ENDIF + IF (associated(P%right)) THEN + !$OMP TASK ! P is firstprivate by default + call traverse(P%right) + !$OMP END TASK + ENDIF + !$OMP TASKWAIT + CALL process ( P ) + END SUBROUTINE diff --git a/sources/Example_tasking.3c.c b/sources/Example_tasking.3c.c new file mode 100644 index 0000000..c83d36c --- /dev/null +++ b/sources/Example_tasking.3c.c @@ -0,0 +1,33 @@ +/* +* @@name: tasking.3c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +typedef struct node node; +struct node { + int data; + node * next; +}; + +void process(node * p) +{ + /* do work here */ +} +void increment_list_items(node * head) +{ + #pragma omp parallel + { + #pragma omp single + { + node * p = head; + while (p) { + #pragma omp task + // p is firstprivate by default + process(p); + p = p->next; + } + } + } +} diff --git a/sources/Example_tasking.3f.f b/sources/Example_tasking.3f.f new file mode 100644 index 0000000..0a96a58 --- /dev/null +++ b/sources/Example_tasking.3f.f @@ -0,0 +1,33 @@ +! @@name: tasking.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + MODULE LIST + TYPE NODE + INTEGER :: PAYLOAD + TYPE (NODE), POINTER :: NEXT + END TYPE NODE + CONTAINS + SUBROUTINE PROCESS(p) + TYPE (NODE), POINTER :: P + ! do work here + END SUBROUTINE + SUBROUTINE INCREMENT_LIST_ITEMS (HEAD) + TYPE (NODE), POINTER :: HEAD + TYPE (NODE), POINTER :: P + !$OMP PARALLEL PRIVATE(P) + !$OMP SINGLE + P => HEAD + DO + !$OMP TASK + ! P is firstprivate by default + CALL PROCESS(P) + !$OMP END TASK + P => P%NEXT + IF ( .NOT. ASSOCIATED (P) ) EXIT + END DO + !$OMP END SINGLE + !$OMP END PARALLEL + END SUBROUTINE + END MODULE diff --git a/sources/Example_tasking.4c.c b/sources/Example_tasking.4c.c new file mode 100644 index 0000000..a7b1fb6 --- /dev/null +++ b/sources/Example_tasking.4c.c @@ -0,0 +1,20 @@ +/* +* @@name: tasking.4c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ + int fib(int n) { + int i, j; + if (n<2) + return n; + else { + #pragma omp task shared(i) + i=fib(n-1); + #pragma omp task shared(j) + j=fib(n-2); + #pragma omp taskwait + return i+j; + } + } diff --git a/sources/Example_tasking.4f.f b/sources/Example_tasking.4f.f new file mode 100644 index 0000000..5d31316 --- /dev/null +++ b/sources/Example_tasking.4f.f @@ -0,0 +1,20 @@ +! @@name: tasking.4f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + RECURSIVE INTEGER FUNCTION fib(n) RESULT(res) + INTEGER n, i, j + IF ( n .LT. 2) THEN + res = n + ELSE +!$OMP TASK SHARED(i) + i = fib( n-1 ) +!$OMP END TASK +!$OMP TASK SHARED(j) + j = fib( n-2 ) +!$OMP END TASK +!$OMP TASKWAIT + res = i+j + END IF + END FUNCTION diff --git a/sources/Example_tasking.5c.c b/sources/Example_tasking.5c.c new file mode 100644 index 0000000..7d9c27f --- /dev/null +++ b/sources/Example_tasking.5c.c @@ -0,0 +1,23 @@ +/* +* @@name: tasking.5c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#define LARGE_NUMBER 10000000 +double item[LARGE_NUMBER]; +extern void process(double); + +int main() { +#pragma omp parallel + { + #pragma omp single + { + int i; + for (i=0; i + +void something_useful ( void ); +void something_critical ( void ); +void foo ( omp_lock_t * lock, int n ) +{ + int i; + + for ( i = 0; i < n; i++ ) + #pragma omp task + { + something_useful(); + while ( !omp_test_lock(lock) ) { + #pragma omp taskyield + } + something_critical(); + omp_unset_lock(lock); + } +} diff --git a/sources/Example_taskyield.1f.f b/sources/Example_taskyield.1f.f new file mode 100644 index 0000000..c5523dc --- /dev/null +++ b/sources/Example_taskyield.1f.f @@ -0,0 +1,23 @@ +! @@name: taskyield.1f +! @@type: F-free +! @@compilable: yes +! @@linkable: no +! @@expect: success +subroutine foo ( lock, n ) + use omp_lib + integer (kind=omp_lock_kind) :: lock + integer n + integer i + + do i = 1, n + !$omp task + call something_useful() + do while ( .not. omp_test_lock(lock) ) + !$omp taskyield + end do + call something_critical() + call omp_unset_lock(lock) + !$omp end task + end do + +end subroutine diff --git a/sources/Example_teams.1c.c b/sources/Example_teams.1c.c new file mode 100644 index 0000000..a9429f7 --- /dev/null +++ b/sources/Example_teams.1c.c @@ -0,0 +1,34 @@ +/* +* @@name: teams.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +#include +#include +float dotprod(float B[], float C[], int N) +{ + float sum0 = 0.0; + float sum1 = 0.0; + #pragma omp target map(to: B[:N], C[:N]) + #pragma omp teams num_teams(2) + { + int i; + if (omp_get_num_teams() != 2) + abort(); + if (omp_get_team_num() == 0) + { + #pragma omp parallel for reduction(+:sum0) + for (i=0; i TARG + I = 5 + +!$OMP PARALLEL COPYIN(I, PTR) +!$OMP CRITICAL + IF (FIRSTIN) THEN + TARG = 4 ! Update target of ptr + I = I + 10 + IF (ALLOCATED(A)) A = A + 10 + FIRSTIN = .FALSE. + END IF + + IF (ALLOCATED(A)) THEN + PRINT *, 'a = ', A + ELSE + PRINT *, 'A is not allocated' + END IF + + PRINT *, 'ptr = ', PTR + PRINT *, 'i = ', I + PRINT * + +!$OMP END CRITICAL +!$OMP END PARALLEL + END PROGRAM INC_GOOD2 diff --git a/sources/Example_threadprivate.6f.f b/sources/Example_threadprivate.6f.f new file mode 100644 index 0000000..d614fed --- /dev/null +++ b/sources/Example_threadprivate.6f.f @@ -0,0 +1,30 @@ +! @@name: threadprivate.6f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: yes +! @@expect: success + MODULE INC_MODULE_GOOD3 + REAL, POINTER :: WORK(:) + SAVE WORK +!$OMP THREADPRIVATE(WORK) + END MODULE INC_MODULE_GOOD3 + + SUBROUTINE SUB1(N) + USE INC_MODULE_GOOD3 +!$OMP PARALLEL PRIVATE(THE_SUM) + ALLOCATE(WORK(N)) + CALL SUB2(THE_SUM) + WRITE(*,*)THE_SUM +!$OMP END PARALLEL + END SUBROUTINE SUB1 + + SUBROUTINE SUB2(THE_SUM) + USE INC_MODULE_GOOD3 + WORK(:) = 10 + THE_SUM=SUM(WORK) + END SUBROUTINE SUB2 + + PROGRAM INC_GOOD3 + N = 10 + CALL SUB1(N) + END PROGRAM INC_GOOD3 diff --git a/sources/Example_workshare.1f.f b/sources/Example_workshare.1f.f new file mode 100644 index 0000000..c77c4de --- /dev/null +++ b/sources/Example_workshare.1f.f @@ -0,0 +1,18 @@ +! @@name: workshare.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WSHARE1(AA, BB, CC, DD, EE, FF, N) + INTEGER N + REAL AA(N,N), BB(N,N), CC(N,N), DD(N,N), EE(N,N), FF(N,N) + +!$OMP PARALLEL +!$OMP WORKSHARE + AA = BB + CC = DD + EE = FF +!$OMP END WORKSHARE +!$OMP END PARALLEL + + END SUBROUTINE WSHARE1 diff --git a/sources/Example_workshare.2f.f b/sources/Example_workshare.2f.f new file mode 100644 index 0000000..76f9475 --- /dev/null +++ b/sources/Example_workshare.2f.f @@ -0,0 +1,20 @@ +! @@name: workshare.2f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WSHARE2(AA, BB, CC, DD, EE, FF, N) + INTEGER N + REAL AA(N,N), BB(N,N), CC(N,N) + REAL DD(N,N), EE(N,N), FF(N,N) + +!$OMP PARALLEL +!$OMP WORKSHARE + AA = BB + CC = DD +!$OMP END WORKSHARE NOWAIT +!$OMP WORKSHARE + EE = FF +!$OMP END WORKSHARE +!$OMP END PARALLEL + END SUBROUTINE WSHARE2 diff --git a/sources/Example_workshare.3f.f b/sources/Example_workshare.3f.f new file mode 100644 index 0000000..3eb8334 --- /dev/null +++ b/sources/Example_workshare.3f.f @@ -0,0 +1,19 @@ +! @@name: workshare.3f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WSHARE3(AA, BB, CC, DD, N) + INTEGER N + REAL AA(N,N), BB(N,N), CC(N,N), DD(N,N) + REAL R + R=0 +!$OMP PARALLEL +!$OMP WORKSHARE + AA = BB +!$OMP ATOMIC UPDATE + R = R + SUM(AA) + CC = DD +!$OMP END WORKSHARE +!$OMP END PARALLEL + END SUBROUTINE WSHARE3 diff --git a/sources/Example_workshare.4f.f b/sources/Example_workshare.4f.f new file mode 100644 index 0000000..af945aa --- /dev/null +++ b/sources/Example_workshare.4f.f @@ -0,0 +1,21 @@ +! @@name: workshare.4f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WSHARE4(AA, BB, CC, DD, EE, FF, GG, HH, N) + INTEGER N + REAL AA(N,N), BB(N,N), CC(N,N) + REAL DD(N,N), EE(N,N), FF(N,N) + REAL GG(N,N), HH(N,N) + +!$OMP PARALLEL +!$OMP WORKSHARE + AA = BB + CC = DD + WHERE (EE .ne. 0) FF = 1 / EE + GG = HH +!$OMP END WORKSHARE +!$OMP END PARALLEL + + END SUBROUTINE WSHARE4 diff --git a/sources/Example_workshare.5f.f b/sources/Example_workshare.5f.f new file mode 100644 index 0000000..612bae6 --- /dev/null +++ b/sources/Example_workshare.5f.f @@ -0,0 +1,20 @@ +! @@name: workshare.5f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WSHARE5(AA, BB, CC, DD, N) + INTEGER N + REAL AA(N,N), BB(N,N), CC(N,N), DD(N,N) + + INTEGER SHR + +!$OMP PARALLEL SHARED(SHR) +!$OMP WORKSHARE + AA = BB + SHR = 1 + CC = DD * SHR +!$OMP END WORKSHARE +!$OMP END PARALLEL + + END SUBROUTINE WSHARE5 diff --git a/sources/Example_workshare.6f.f b/sources/Example_workshare.6f.f new file mode 100644 index 0000000..5b4f6dd --- /dev/null +++ b/sources/Example_workshare.6f.f @@ -0,0 +1,20 @@ +! @@name: workshare.6f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WSHARE6_WRONG(AA, BB, CC, DD, N) + INTEGER N + REAL AA(N,N), BB(N,N), CC(N,N), DD(N,N) + + INTEGER PRI + +!$OMP PARALLEL PRIVATE(PRI) +!$OMP WORKSHARE + AA = BB + PRI = 1 + CC = DD * PRI +!$OMP END WORKSHARE +!$OMP END PARALLEL + + END SUBROUTINE WSHARE6_WRONG diff --git a/sources/Example_workshare.7f.f b/sources/Example_workshare.7f.f new file mode 100644 index 0000000..51a086e --- /dev/null +++ b/sources/Example_workshare.7f.f @@ -0,0 +1,17 @@ +! @@name: workshare.7f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE WSHARE7(AA, BB, CC, N) + INTEGER N + REAL AA(N), BB(N), CC(N) + +!$OMP PARALLEL +!$OMP WORKSHARE + AA(1:50) = BB(11:60) + CC(11:20) = AA(1:10) +!$OMP END WORKSHARE +!$OMP END PARALLEL + + END SUBROUTINE WSHARE7 diff --git a/sources/Example_worksharing_critical.1c.c b/sources/Example_worksharing_critical.1c.c new file mode 100644 index 0000000..61bf0f4 --- /dev/null +++ b/sources/Example_worksharing_critical.1c.c @@ -0,0 +1,27 @@ +/* +* @@name: worksharing_critical.1c +* @@type: C +* @@compilable: yes +* @@linkable: no +* @@expect: success +*/ +void critical_work() +{ + int i = 1; + #pragma omp parallel sections + { + #pragma omp section + { + #pragma omp critical (name) + { + #pragma omp parallel + { + #pragma omp single + { + i++; + } + } + } + } + } +} diff --git a/sources/Example_worksharing_critical.1f.f b/sources/Example_worksharing_critical.1f.f new file mode 100644 index 0000000..f57f2b7 --- /dev/null +++ b/sources/Example_worksharing_critical.1f.f @@ -0,0 +1,21 @@ +! @@name: worksharing_critical.1f +! @@type: F-fixed +! @@compilable: yes +! @@linkable: no +! @@expect: success + SUBROUTINE CRITICAL_WORK() + + INTEGER I + I = 1 + +!$OMP PARALLEL SECTIONS +!$OMP SECTION +!$OMP CRITICAL (NAME) +!$OMP PARALLEL +!$OMP SINGLE + I = I + 1 +!$OMP END SINGLE +!$OMP END PARALLEL +!$OMP END CRITICAL (NAME) +!$OMP END PARALLEL SECTIONS + END SUBROUTINE CRITICAL_WORK