analysis.py 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411
  1. #analysis functions for cardiacSPECT dynamic data analysis
  2. #see clusterAnalysis.ipynb for details on usage
  3. import os
  4. import getData
  5. import config
  6. import subprocess
  7. import SimpleITK
  8. import numpy
  9. import re
  10. import json
  11. import segmentation
  12. def calculateCenters(db,setup):
  13. #path of scripts is ../scripts
  14. #one up
  15. #scriptPath
  16. rows=getData.getPatients(db,setup)
  17. # $MATLAB -sd $MATLABSCRIPTDIR -batch "patientID='${PATIENTID}'; nclass='${NCLASS}'; nRealizations='${NR}'; generateCenters" >& ~/logs/dynamicSPECT.log;
  18. for r in rows:
  19. #download
  20. calculateRowCenters(r,setup)
  21. def calculateRowCenters(r,setup):
  22. cmds=config.cmdMatlab()
  23. tempDir=config.getTempDir(setup)
  24. code=config.getCode(r,setup)
  25. nr=setup['nr']
  26. nclass=setup['nclass']
  27. for nc in nclass:
  28. runCmds=[x for x in cmds]
  29. runCmds.append('-r "path=\'{}\'; patientID=\'{}\'; nclass=\'{}\'; nRealizations=\'{}\'; generateCenters"'.format(tempDir,code,nc,nr))
  30. print('centers: {}/{},{}'.format(code,nc,nr))
  31. #redirect and print output to stdout
  32. print(runCmds)
  33. print(subprocess.run(runCmds, check=True, stdout=subprocess.PIPE).stdout)
  34. def doAnalysis(db,setup,mode):
  35. rows=getData.getPatients(db,setup)
  36. for r in rows:
  37. doAnalysisRow(r,xsetup,mode)
  38. def doAnalysisRow(r,xsetup,mode):
  39. cmds=config.cmdMatlab()
  40. tempDir=config.getTempDir(xsetup)
  41. #this is if IVF is inferred together with k1 fits
  42. #runScript='doAnalysis.sh'
  43. #this is if IVF is taken from previous cluster fits
  44. #runScript='doAnalysisIVF.sh'
  45. if mode=='global':
  46. mScript='analyze'
  47. analysisType=''
  48. if mode=='IVF':
  49. mScript='analyzeIVF'
  50. analysisType='IVF_'
  51. try:
  52. print('Setting runScript to {}'.format(mScript))
  53. except NameError:
  54. print('Mode can be one of (global,IVF))')
  55. return
  56. code=config.getCode(r,xsetup)
  57. nr=xsetup['nr']
  58. nclass=xsetup['nclass']
  59. for nc in nclass:
  60. for j in numpy.arange(nr):
  61. print('{} [{} {}/{}]'.format(code,nc,j+1,nr))
  62. #avoid repetition, only do for new files
  63. #this is a duplicate of path generated in fitCenters.m
  64. fName=os.path.join(tempDir,code,config.getFitParFinalName(code,nc,j,analysisType))
  65. if os.path.isfile(fName):
  66. print('Skipping; {} available.'.format(fName))
  67. continue
  68. runCmds=[x for x in cmds]
  69. runCmds.append('-r "path=\'{}\'; patientID=\'{}\'; nclass=\'{}\'; realizationId=\'{}\'; {}"'.format(tempDir,code,nc,j+1,mScript))
  70. subprocess.run(runCmds,check=True, stdout=subprocess.PIPE)
  71. def doPixelAnalysis(db,setup,sigma2,mode='IVF'):
  72. baseDir=os.path.dirname(os.getcwd())#one up
  73. rows=getData.getPatients(db,setup)
  74. for r in rows:
  75. doPixelAnalysisRow(r,setup,mode)
  76. def doPixelAnalysisRow(r,setup, mode='IVF'):
  77. cmds=config.cmdMatlab()
  78. tempDir=config.getTempDir(setup)
  79. #
  80. #in global mode, IVF parameters are inferred together with fits to classes
  81. #this is essentially repeat of the above, except that classes are taken as
  82. #time-response curves from pixels in the sigma2-defined neighborhood of
  83. #target pixels
  84. if mode=='global':
  85. mScript='analyzePixel'
  86. analysisType=''
  87. if mode=='IVF':
  88. mScript='analyzePixelIVF'
  89. analysisType='IVF_'
  90. #in IVF mode, the parameters of input function are taken from the cluster fit
  91. #(doAnalysis above, with mode=general). The rest is the same as for global mode
  92. try:
  93. print('Setting runScript to {}'.format(mScript))
  94. except NameError:
  95. print('Mode can be one of (global,IVF))')
  96. return
  97. #code=config.getCode(r,setup)
  98. nc=segmentation.getNC(r,setup)
  99. #loadSegmentation(db,fb,r,setup)
  100. #nc=x.shape[0]
  101. sigma2=setup['sigma2']
  102. code=config.getCode(r,setup)
  103. for s2 in sigma2:
  104. f=config.getPixelFitParFinalName(code,nc,s2,mode)
  105. fName=getData.getLocalPath(r,setup,f)
  106. sFile=segmentation.getSegmentationFileName(r,setup)
  107. segmFile=getData.getLocalPath(r,setup,sFile)
  108. if os.path.isfile(fName):
  109. print('Skipping; {} available.'.format(fName))
  110. continue
  111. runCmds=[x for x in cmds]
  112. runCmds.append('-r "path=\'{}\'; patientID=\'{}\'; sigma2=\'{}\' segmFile=\'{}\'; {}"'.format(tempDir,code,s2,segmFile,mScript))
  113. subprocess.run(runCmds,check=True, stdout=subprocess.PIPE)
  114. def getIWeights(r,setup,nclass,realizationId,ic):
  115. locDir=config.getLocalDir(r,setup)
  116. code=config.getCode(r,setup)
  117. fname='{}_{}_{}_center{}_centerWeigth.nrrd'.\
  118. format(code,nclass,realizationId+1,ic+1)
  119. uFile=os.path.join(locDir,fname)
  120. imU=SimpleITK.ReadImage(uFile)
  121. return SimpleITK.GetArrayFromImage(imU)
  122. def getGaussianWeight(nU,pt,sigma2,na):
  123. #gaussian weighted summation of surrounding pixels
  124. #find point closest to the target point
  125. idx=[int(x) for x in pt]
  126. #running offset
  127. fidx=numpy.zeros(3)
  128. #half of the neighborhood
  129. na2=0.5*(na-1)
  130. fs=0
  131. fWeight=0
  132. for i in numpy.arange(na):
  133. fidx[0]=idx[0]+(i-na2)
  134. for j in numpy.arange(na):
  135. fidx[1]=idx[1]+(j-na2)
  136. for k in numpy.arange(na):
  137. fidx[2]=idx[2]+(k-na2)
  138. fidx=[int(x) for x in fidx]
  139. fd=numpy.array(fidx)-numpy.array(pt)
  140. dist2=numpy.sum(fd*fd)
  141. fw=numpy.exp(-0.5*dist2/sigma2);
  142. fs+=fw
  143. fWeight+=fw*nU[tuple(fidx)]
  144. #print('\t{}/{}: {}/{:.2f} {:.2g} {:.3g} {:.2g}'.format(idx,fidx,numpy.sqrt(dist2),fw,nU[tuple(fidx)],fs,fWeight))
  145. fWeight/=fs
  146. return fWeight
  147. #gets weights by class for a particular realization and sigma2 averaging
  148. def getWeights(db,r,setup,nclass,realizationId,sigma2,na):
  149. #for w1, classes are in 0 to nclass-1 space
  150. #na is the size of the neighborhood
  151. idFilter=config.getIdFilter(r,setup)
  152. visitFilter=config.getVisitFilter(r,setup)
  153. code=config.getCode(r,setup)
  154. rows=getData.getSegmentation(db,setup,[idFilter,visitFilter])
  155. pts={r['regionId']:[float(x) for x in [r['x'],r['y'],r['z']]] for r in rows}
  156. w={region:numpy.zeros(nclass) for region in pts}
  157. na2=0.5*(na-1)
  158. for c in numpy.arange(nclass):
  159. nU=getIWeights(r,setup,nclass,realizationId,c)
  160. for region in w:
  161. #print(pts[region])
  162. #print('{} {}/{} {}'.format(code,c,nclass,region))
  163. #gaussian weighted summation of surrounding pixels
  164. w[region][c]=getGaussianWeight(nU,pts[region],sigma2,na)
  165. return w
  166. #gets fitPar for a particular realization in [0..nr-1] range
  167. def getPixelFitPar(fb,r,setup,nc,s2,mode):
  168. code=config.getCode(r,setup)
  169. f=config.getPixelFitParFinalName(code,nc,s2,mode)
  170. print('getPixelFitPar {}'.format(f))
  171. getData.copyFromServer(fb,r,setup,[f])
  172. fName=getData.getLocalPath(r,setup,f)
  173. print('getPixelFitPar {}'.format(fName))
  174. return numpy.genfromtxt(fName,delimiter='\t')
  175. def getFitPar(fb,r,setup,nclass,realizationId,mode):
  176. code=config.getCode(r,setup)
  177. f=config.getFitParFinalName(code,nclass,realizationId,mode)
  178. getData.copyFromServer(fb,r,setup,[f])
  179. fName=getData.getLocalPath(r,setup,f)
  180. return numpy.genfromtxt(fName,delimiter='\t')
  181. def getFitParBackup(r,setup,nclass,realizationId,mode=''):
  182. #fitGoodnes A tau alpha delay [k1 BVF k2 delay]xNcenters
  183. allowedModes=['','IVF','Pixel','PixelIVF']
  184. if mode not in allowedModes:
  185. print('Mode should be one of {}'.format(allowedModes))
  186. return []
  187. if mode=='PixelIVF':
  188. #4th parameter is sigma, not realizationId
  189. rCode='{:.2f}'.format(realizationId)
  190. rCode=re.sub('\.','p',rCode)
  191. else:
  192. #add one to match matlab 1..N array indexing
  193. rCode='{}'.format(realizationId+1)
  194. if len(mode)>0:
  195. mode=mode+'_'
  196. code=config.getCode(r,setup)
  197. fname='{}_{}_{}_{}fitParFinal.txt'.format(code,nclass,rCode,mode)
  198. locDir=config.getLocalDir(r,setup)
  199. uFile=os.path.join(locDir,fname)
  200. return numpy.genfromtxt(uFile,delimiter='\t')
  201. def getK1(fitPar,iclass):
  202. #fitGoodnes A tau alpha delay [k1 BVF k2 delay]xNcenters
  203. #0 to nclass-1 space
  204. return fitPar[4*iclass+5]
  205. def calculateK1(w,fitPar):
  206. #calculateK1 for region weights
  207. #return the k1 that belongs to the
  208. #maximum class in region (M) and
  209. #a weighted average (W)
  210. k1={region:{'M':0,'W':0} for region in w}
  211. for region in w:
  212. cmax=numpy.argmax(w[region])
  213. k1[region]['M']=getK1(fitPar,cmax)
  214. fs=0
  215. for c in numpy.arange(len(w[region])):
  216. fs+=w[region][c]*getK1(fitPar,c)
  217. k1[region]['W']=fs
  218. return k1
  219. def getPatientValuesByNclass(db,r,setup,nclass,nrealizations,sigma2,na):
  220. #summary script
  221. #db is for database; needs segmentations
  222. #r,setup identify patient
  223. #nclass and nrealizations select strategy
  224. #sigma2 is for combining output from adjacent pixels
  225. #na is neighborhood size where smoothing/combination is done
  226. k1={}
  227. for rId in numpy.arange(nrealizations):
  228. w=getWeights(db,r,setup,nclass,rId,sigma2,na)
  229. fitPar=getFitPar(r,setup,nclass,rId,'IVF')
  230. qk1=calculateK1(w,fitPar)
  231. for region in w:
  232. for type in qk1[region]:
  233. try:
  234. k1[region][type].append(qk1[region][type])
  235. except KeyError:
  236. k1={region:{type:[] for type in qk1[region]} for region in w}
  237. print(type)
  238. k1[region][type].append(qk1[region][type])
  239. print('[{}] {}/{}'.format(nclass,rId+1,nrealizations))
  240. return k1
  241. def getSummaryPatientValuesByNclass(db,r,setup,nclass,nrealizations,sigma2,na):
  242. #summary script, same arguments as above
  243. #also return deviation over realization
  244. k1=getPatientValuesByNclass(db,r,setup,nclass,nrealizations,sigma2,na)
  245. avgType=['M','W']
  246. summaryK1={type:{region:{
  247. 'mean':numpy.mean(k1[region][type]),
  248. 'std':numpy.std(k1[region][type]),
  249. 'median':numpy.median(k1[region][type])} for region in k1}
  250. for type in avgType}
  251. return summaryK1
  252. def fullSummary(db,setup,classes,nr,sigma2,na):
  253. rows=getData.getPatients(db,setup)
  254. return \
  255. {config.getCode(r,setup):\
  256. {c:getSummaryPatientValuesByNclass(db,r,setup,c,nr,sigma2,na) for c in classes} for r in rows}
  257. def storeSummary(db,setup,summary,sigma2,na):
  258. #dsM=db.selectRows(project,'study','Imaging',[])
  259. for rCode in summary:
  260. r=config.decode(rCode,setup)
  261. idFilter=config.getIdFilter(r,setup)
  262. visitFilter=config.getVisitFilter(r,setup)
  263. for c in summary[rCode]:
  264. cFilter={'variable':'nclass','value':str(c),'oper':'eq'}
  265. for t in summary[rCode][c]:
  266. tFilter={'variable':'option','value':t,'oper':'eq'}
  267. for rId in summary[rCode][c][t]:
  268. rFilter={'variable':'regionId','value':str(rId),'oper':'eq'}
  269. rows=getData.getSummary(db,setup,[idFilter,visitFilter,cFilter,tFilter,rFilter])
  270. if len(rows)>0:
  271. qrow=rows[0]
  272. mode='update'
  273. else:
  274. qrow={qr:r[qr] for qr in r}
  275. qrow['nclass']=c
  276. qrow['option']=t
  277. qrow['regionId']=rId
  278. seqNum=config.getTargetSeqNum(r,setup)
  279. qrow['SequenceNum']=100+seqNum+c+0.001*rId
  280. if t=='M':
  281. qrow['SequenceNum']+=0.0001
  282. mode='insert'
  283. for v in summary[rCode][c][t][rId]:
  284. qrow[v]=summary[rCode][c][t][rId][v]
  285. qrow['sigma2']=sigma2
  286. qrow['na']=na
  287. getData.updateSummary(db,setup,mode,[qrow])
  288. def summaryPixelIVF(db,fb,setup):
  289. #for second type of analysis (pixel based regions)
  290. qfilter=config.getFilter(setup)
  291. rows=getData.getPatients(db,setup,qfilter)
  292. sigma2=setup['sigma2']
  293. return \
  294. {config.getCode(r,setup):\
  295. {s2:getPixelIVF(db,fb,r,setup,s2) for s2 in sigma2} for r in rows}
  296. def storeIVF(db,setup,summary):
  297. for rCode in summary:
  298. r=config.decode(rCode,setup)
  299. idFilter=config.getIdFilter(r,setup)
  300. visitFilter=config.getVisitFilter(r,setup)
  301. for s2 in summary[rCode]:
  302. sigmaFilter={'variable':'sigma2','value':str(s2),'oper':'eq'}
  303. nr=len(summary[rCode][s2])
  304. for rId in summary[rCode][s2]:
  305. rFilter={'variable':'regionId','value':str(rId),'oper':'eq'}
  306. typeFilter={'variable':'option','value':'D','oper':'eq'}
  307. rows=getData.getSummary(db,setup,[idFilter,visitFilter,sigmaFilter,rFilter,typeFilter])
  308. if len(rows)>0:
  309. qrow=rows[0]
  310. mode='update'
  311. else:
  312. qrow={qr:r[qr] for qr in r}
  313. qrow['sigma2']=s2
  314. qrow['regionId']=rId
  315. seqNum=config.getTargetSeqNum(r,setup)
  316. qrow['SequenceNum']=140+seqNum+0.01*rId+0.001*s2
  317. mode='insert'
  318. qrow['mean']=summary[rCode][s2][rId]
  319. qrow['na']=7
  320. qrow['nclass']=nr
  321. qrow['option']='D'
  322. getData.updateSummary(db,setup,mode,[qrow])
  323. def getPixelIVF(db,fb,r,setup,sigma2):
  324. idFilter=config.getIdFilter(r,setup)
  325. visitFilter=config.getVisitFilter(r,setup)
  326. rows=getData.getSegmentation(db,setup,[idFilter,visitFilter])
  327. nclassIVF=len(rows)
  328. #x=segmentation.loadSegmentation(db,fb,r,setup)
  329. #nclassIVF=x.shape[0]
  330. #this assumes segmentation is loaded
  331. #nclassIVF=segmentation.getNC(r,setup)
  332. #fitPar=getFitPar(r,setup,nclassIVF,sigma2,'PixelIVF')
  333. fitPar=getPixelFitPar(fb,r,setup,nclassIVF,sigma2,'IVF')
  334. print(fitPar)
  335. k1={r['regionId']:getK1(fitPar,r['regionId']) for r in rows}
  336. return k1