multithreading - Openmp:与omp_get_thread_num()并行使用

multithreading - Openmp:与omp_get_thread_num()并行使用

转载作者：行者123 更新时间：2023-12-03 13:16:31

我正在使用 parallel do 和 private 子句来拆分 do 循环。在这个循环中，我把一个变量累加到它自身。在这种情况下我并没有用到 critical 或 atomic 指令，为什么还会出现错误？
我该如何解决？

program trap  ! Trapezoid-rule estimate of pi = integral of 4/(1+x*x) over [0,1], split by hand across OpenMP threads.
use omp_lib 
implicit none
double precision::suma=0.d0 ! running sum (scalar); not in the private list below, so shared by OpenMP default
double precision:: h,x,lima,limb  ! step size, sample point, lower and upper integration limits
integer::n,i, istart, iend, thread_num=4, total_threads, ppt  ! NOTE(review): total_threads is never assigned
integer(kind=8):: tic, toc, rate  ! system_clock start count, end count and counts per second
double precision:: time  ! elapsed wall-clock time in seconds
double precision, dimension(4):: pi= 0.d0  ! indexed as pi(thread_num+1) in the loop; holds at most 4 entries

call system_clock(count_rate = rate)
call system_clock(tic)

lima=0.0d0; limb=1.0d0; suma=0.0d0; n=100000000  ! integrate over [0,1] using n sub-intervals
h=(limb-lima)/n  ! width of one sub-interval

suma=h*(f(lima)+f(limb))*0.5d0 ! endpoint term h*(f(a)+f(b))/2; overwritten later by suma=sum(pi)

ppt= n/total_threads  ! points per thread; NOTE(review): total_threads has no value assigned at this point
!$ call omp_set_num_threads(total_threads)

!$omp parallel do private (istart, iend, thread_num, i)
  thread_num = omp_get_thread_num()  ! rejected by gfortran: a parallel do directive must be followed directly by the do loop
  !$ istart = thread_num*ppt +1
  !$ iend = min(thread_num*ppt + ppt, n)
do i=istart,iend ! each thread is meant to loop over its own istart..iend slice
  x=lima+i*h  ! NOTE(review): x is not listed as private, so threads would share it
  suma=suma+f(x)   ! NOTE(review): unsynchronized update of the shared suma
  pi(thread_num+1)=suma  ! store the running total in this thread's slot of pi
enddo
!$omp end parallel do 

suma=sum(pi)   ! combine the per-thread slots (replaces the endpoint term computed earlier)
suma=suma*h  ! scale the summed function values by the step size

print *,"The value of pi is= ",suma ! printed once, after the parallel construct has ended

call system_clock(toc)
time = real(toc-tic)/real(rate)  ! elapsed seconds = clock counts / counts per second
print*, 'Time ', time, 's'

contains

double precision function f(y)  ! integrand 4/(1+y*y)
double precision:: y  ! evaluation point
f=4.0d0/(1.0d0+y*y)
end function f

end program trap

我收到以下错误:
test.f90:23:35:
23 | thread_num = omp_get_thread_num()
错误:(1)处的意外赋值语句
test.f90:24:31:
24 | !$ istart = thread_num * ppt +1
错误:(1)处的意外赋值语句
test.f90:25:40:
25 | !$ iend = min(thread_num * ppt + ppt, n)
错误:(1)处的意外赋值语句
编译:

gfortran -fopenmp -Wall -Wextra -O2 -Wall -o prog.exe test.f90 

./prog.exe

最佳答案

既然 OpenMP 中的工作共享构造(例如 !$omp do)可以自动为您拆分循环，我不明白为什么还要手动拆分。下面是我的做法:

ian@eris:~/work/stack$ cat thread.f90
!> Estimate pi as the integral of 4/(1+x**2) over [lima, limb] = [0, 1] using
!> the composite trapezoidal rule
!>
!>   h * ( (f(lima) + f(limb))/2 + sum_{i=1}^{n-1} f(lima + i*h) )
!>
!> The interior-point sum is computed in parallel: the OpenMP worksharing loop
!> splits the iterations between threads and the reduction clause combines the
!> per-thread partial sums, so no manual partitioning by thread number and no
!> critical/atomic update is needed. The number of threads comes from the
!> OpenMP runtime (for example the OMP_NUM_THREADS environment variable).
program trap
  use, intrinsic :: iso_fortran_env, only: wp => real64, li => int64
  use omp_lib, only: omp_get_max_threads
  implicit none

  real(wp)    :: lima, limb   ! lower and upper integration limits
  real(wp)    :: h            ! width of one sub-interval
  real(wp)    :: x            ! sample point (private to each thread)
  real(wp)    :: suma         ! endpoint term (f(lima) + f(limb))/2
  real(wp)    :: interior     ! sum of f over the n-1 interior points
  real(wp)    :: pi           ! final estimate
  real(wp)    :: time         ! elapsed wall-clock time in seconds
  integer(li) :: tic, toc, rate
  integer     :: i, n

  call system_clock(count_rate=rate)
  call system_clock(tic)

  lima = 0.0_wp
  limb = 1.0_wp
  n = 100000000
  h = (limb - lima)/real(n, wp)

  ! First and last points carry half weight in the trapezoidal rule.
  suma = 0.5_wp*(f(lima) + f(limb))

  ! lima is only read inside the loop, so it must be shared: a private copy
  ! would be undefined on entry to the parallel region.
  interior = 0.0_wp
  !$omp parallel do default(none) private(i, x) shared(n, h, lima) &
  !$omp             reduction(+:interior)
  do i = 1, n - 1
    x = lima + real(i, wp)*h
    interior = interior + f(x)
  end do
  !$omp end parallel do

  ! Scale by the step size h (not 1/n) so the result stays correct for any
  ! integration interval, and include the endpoint term.
  pi = h*(suma + interior)

  print *, "The value of pi is= ", pi

  call system_clock(toc)
  ! Convert in working precision; default real would lose digits of the count.
  time = real(toc - tic, wp)/real(rate, wp)
  print *, 'Time ', time, 's on ', omp_get_max_threads(), ' threads'

contains

  !> Integrand 4/(1+y**2), whose integral over [0,1] equals pi.
  pure function f(y) result(val)
    real(wp), intent(in) :: y
    real(wp) :: val
    val = 4.0_wp/(1.0_wp + y*y)
  end function f

end program trap
ian@eris:~/work/stack$ gfortran --version
GNU Fortran (Ubuntu 7.4.0-1ubuntu1~18.04.1) 7.4.0
Copyright (C) 2017 Free Software Foundation, Inc.
This is free software; see the source for copying conditions.  There is NO
warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.

ian@eris:~/work/stack$ export OMP_NUM_THREADS=1
ian@eris:~/work/stack$ ./a.out
 The value of pi is=    3.1415926435902248     
 Time    1.8548842668533325      s on            1  threads
ian@eris:~/work/stack$ export OMP_NUM_THREADS=2
ian@eris:~/work/stack$ ./a.out
 The value of pi is=    3.1415926435902120     
 Time   0.86763000488281250      s on            2  threads
ian@eris:~/work/stack$ export OMP_NUM_THREADS=4
ian@eris:~/work/stack$ ./a.out
 The value of pi is=    3.1415926435898771     
 Time   0.54704123735427856      s on            4  threads
ian@eris:~/work/stack$

关于multithreading - Openmp:与omp_get_thread_num()并行使用，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/66604498/

文章推荐： c++ - C++ 11中与std::atomic的同步

文章推荐： c++ - C++线程加入后不会中止

文章推荐： c++ - 在函数周围调用std::thread()的工作方式不同

c++ - omp_get_thread_num() 返回有问题的数字？
代码有几千行，所以我不能粘贴它们，但是函数流程看起来有点像: void Func_1(double * x, int nx, NUM_THREADS) { omp_set_num_threads(
multithreading - omp_get_num_threads() 和 omp_get_thread_num() 返回废话
我刚开始使用英特尔 Fortran 编译器和 Visual Studio 2015 在 Fortran 中使用 OpenMP。在项目属性中，我将“Fortran -> 语言 -> 处理 OpenMP
c++ - 使用 omp_get_thread_num 索引全局 vector 是否安全？
我有一个这样的代码: thread_local CustomAllocator* ts_alloc = nullptr; struct AllocatorSetup { AllocatorSe
c++ - 避免使用 simd 并行调用 omp_get_thread_num() for 循环
与查找变量值相比，调用 omp_get_thread_num() 的性能成本是多少？如何避免在 simd openmp 循环中多次调用 omp_get_thread_num()？我可以使用 #pr
c++ - omp_set_num_threads 总是返回 0 并且我无法使用 omp_get_thread_num() 获取线程号
我有一个使用 omp 进行并行化的 C++ 类库。我注意到我的问题，因为它总是用完我处理器上的所有内核，不管 omp_set_num_threads(threadCount) 有什么作为输入。所以在
c++ - 在 openmp 中，omp_get_thread_num 是否绑定(bind)到物理线程？
我了解到 OpenMP 使用线程池来重用物理线程。我的问题是从omp_get_thread_num 获取的线程号是否绑定(bind)到物理线程？换句话说，omp_get_thread_num 到 g

行者123

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

multithreading - Openmp:与omp_get_thread_num()并行使用