c Energy funtion. c ERG is the energy of a loop closed by I,J (new numbering). c IP,JP is the other closing base-pair when MODE = 2 or 3. c c 1/2 Asym. loop correction c Extrapolate loops with dG(n)=dG(30)+1.75*ln(n/30) c Hairpins of 3 have no terminal stack. c function erg(mode,i,j,ip,jp) include 'rfd.inc' dimension e(4) integer*2 tlink,tlptr logical fce 100 if (mode.eq.1) then c Read energy files call ergread erg = 0 return endif erg = 0 c Do not allow prohibited bases to pair. if (force(i).eq.1.or.force(j).eq.1) then erg = infinity return endif if (mode.lt.6) then c Add bonus energy to force base-pairs. if (force(i).eq.2.or.force(j).eq.2.or.fce(i,j)) then erg = erg + eparam(9) if (force(i).eq.2.and.force(j).eq.2) erg = erg + eparam(9) endif endif goto (100,200,300,400,500,600,700),mode c Nucleotide accesssibility option. 200 if (force(i).eq.3.or.force(jp).eq.3) then erg = infinity return endif c Stacking energy. erg = erg + stack(numseq(i),numseq(j),numseq(ip),numseq(jp)) . + eparam(1) return 300 size1 = ip - i - 1 size2 = j - jp - 1 if (size1.eq.0.or.size2.eq.0) then c Check for nucleotide accessibility. if (size1.eq.0.and.force(i).eq.3) then erg = infinity return endif if (size2.eq.0.and.force(jp).eq.3) then erg = infinity return endif size = size1+size2 c Bulge loop. if (size.eq.1) then erg = erg + stack(numseq(i),numseq(j),numseq(ip),numseq(jp)) . + bulge(1) + eparam(2) else if (size.gt.30) then loginc = int(prelog*log((float(size)/30.0))) erg = erg + bulge(30) + loginc + eparam(2) else erg = erg + bulge(size) + eparam(2) endif return else size = size1+size2 lopsid = abs((size1-size2)) c Interior loop. if (size.gt.30) then loginc = int(prelog*log((float(size)/30.0))) erg = erg + tstk(numseq(i),numseq(j),numseq(i+1),numseq(j-1)) . + tstk(numseq(jp),numseq(ip),numseq(jp+1),numseq(ip-1)) . + inter(30) + loginc + eparam(3) . + min0(maxpen,(lopsid*poppen(min0(4,size1,size2)))) else erg = erg + tstk(numseq(i),numseq(j),numseq(i+1),numseq(j-1)) . + tstk(numseq(jp),numseq(ip),numseq(jp+1),numseq(ip-1)) . + inter(size) + eparam(3) . + min0(maxpen,(lopsid*poppen(min0(4,size1,size2)))) endif return endif 400 size = j-i-1 c Hairpin loop. if ((size.eq.3).and.fce(i,j).and.seq(hstnum(i+1)).eq.' ') then c Closed excision erg = eparam(9) return endif if (size.gt.30) then loginc = int(prelog*log((float(size)/30.0))) erg = erg + tstk(numseq(i),numseq(j),numseq(i+1),numseq(j-1)) . + hairpin(30) + loginc + eparam(4) else if (size.lt.4) then erg=erg+hairpin(size)+eparam(4) else c tlink=0 if (size.eq.4) then key=((numseq(i+4)*8+numseq(i+3))*8+numseq(i+2))*8+numseq(i+1) tlptr=1 do while ((tlptr.le.numoftloops).and.(tloop(tlptr,1).ne.key)) tlptr=tlptr+1 enddo if (tlptr.le.numoftloops) tlink=tloop(tlptr,2) endif erg = erg + tstk(numseq(i),numseq(j),numseq(i+1),numseq(j-1)) . + hairpin(size) + eparam(4) + tlink endif return c Multi-branch loop. 500 do 501 ii = 1,4 501 e(ii) = infinity if (i.le.n-2) then ind1 = (n-1)*i ind2 = (n-1)*(i+1) else if (i.eq.n-1) then ind1 = (n-1)*i ind2 = -n else ind1 = -n ind2 = -1 endif do k = i+2,j-3 c EPARAM(6) is the energy penalty for each single-stranded base c in a multi-loop. EPARAM(10) is the energy penalty for each base-pair c closing a multi-loop. c No dangling ends next to the I,J base-pair. e(1) = min0(e(1),wst(ind1+k)+work(k+1,mod(j-1,3))) c I+1 dangles on the I,J base-pair. e(2) = min0(e(2),dangle(numseq(i),numseq(j),numseq(i+1),1) . + wst(ind2+k) + work(k+1,mod(j-1,3)) + eparam(6)) c J-1 dangles on the I,J base-pair. e(3) = min0(e(3),dangle(numseq(i),numseq(j),numseq(j-1),2) . + wst(ind1+k) + work(k+1,mod(j-2,3)) + eparam(6)) c Both I+1 and J-1 dangle on the I,J base-pair. e(4) = min0(e(4),dangle(numseq(i),numseq(j),numseq(i+1),1) . + dangle(numseq(i),numseq(j),numseq(j-1),2) . + wst(ind2+k) + work(k+1,mod(j-2,3)) + 2*eparam(6)) enddo c EPARAM(5) is the energy penalty for closing a multi-loop. erg = erg + eparam(5) + eparam(10) + min0(e(1),e(2),e(3),e(4)) return c Dangling base stacking energy. IP dangles over the I,J c base-pair. 3' or 5' dangle if JP = 1 or 2 respectively. 600 erg = erg + dangle(numseq(i),numseq(j),numseq(ip),jp) return 700 if (force(i).eq.3.or.force(jp).eq.3) then erg = infinity return endif c Terminal stack or mismatch energy. erg = erg + tstk(numseq(i),numseq(j),numseq(ip),numseq(jp)) return end subroutine fill c This subroutine computes the arrays of optimal energies. include 'rfd.inc' dimension inc(5,5) data loop/3/,inc/0,0,0,1,0,0,0,1,0,0,0,1,0,1,0,1,0,1,0,0,0,0,0,0,0 ./ vmin = infinity if (n.le.80) then pinc = 5 elseif (n.le.100) then pinc = 2 else pinc = 1 endif pcnt = pinc crit = n*n*n/50 do j = 1,2*n-1 c How far along is the computation? if (n.gt.10) then if (j.le.n) then if (j**3.ge.pcnt*crit) then write (6,1000) pcnt pcnt = pcnt + pinc endif else if ((2*n-j)**3.le.(100-pcnt)*crit) then write (6,1000) pcnt pcnt = pcnt + pinc endif endif endif 1000 format ('+',5x,i4,'%') do i = min0(j,n),max0(1,j-n+1),-1 vij = infinity wij = infinity if (j-i.le.loop) goto 300 c Test for a prohibited base-pair or a pair which cannot form c a base-pair. if (vst((n-1)*(i-1)+j).eq.1.or.inc(numseq(i),numseq(j)).eq.0) . goto 200 c Compute VIJ, the minimum energy of the fragment from I to J c inclusive where I and J base-pair with one another. c Perhaps I,J closes a hairpin loop. vij = min0(vij,erg(4,i,j,i,j)) if (j-i-1.ge.loop+2) then c Perhaps I,J stacks over I+1,J-1. vij = min0(vij,erg(2,i,j,i+1,j-1)+v(i+1,j-1)) endif c Search for a bulge or interior loop. if (j-i-1.ge.loop+3) then do d = j-i-3,1,-1 do ip = i+1,j-1-d jp = d+ip if (j-i-2-d.gt.eparam(7)) goto 100 if (abs(ip-i+jp-j).le.eparam(8)) then if (ip.gt.n) then vij = min0(vij,erg(3,i,j,ip,jp)+vst((n-1)* . (ip-n-1)+jp-n)) else vij = min0(vij,erg(3,i,j,ip,jp)+vst((n-1)* . (ip-1)+jp)) endif endif enddo enddo endif 100 if (j-i-1.ge.2*loop+4) then c Perhaps I,J closes a multi-loop. vij=min0(vij,erg(5,i,j,i,j)) endif c Compute WIJ, the minimum energy of a non-empty folding on I to c J inclusive. This is the circular folding program and so there c are no exterior bases. 200 wij = min0 ( wij, eparam(10)+vij, v(i+1,j)+eparam(6)+eparam(10)+ . erg(6,j,i+1,i,2), v(i,j-1)+eparam(6)+eparam(10)+ . erg(6,j-1,i,j,1), v(i+1,j-1)+2*eparam(6)+eparam(10)+ . erg(6,j-1,i+1,i,2)+erg(6,j-1,i+1,j,1), . w(i+1,j)+eparam(6), w(i,j-1)+eparam(6) ) if (j-i-1.gt.2*loop+2) then index = (n-1)*(i-1) c Check for open bifurcation. do k = i,j-1 wij = min0(wij,wst(index+k)+work(k+1,mod(j,3))) enddo endif c Store VIJ and WIJ. They can be regarded as elements V(I,J) c and W(I,J) in a two dimensional array. They are actually c stored in the one dimensional arrays VST and WST in position c (N-1)*(I-1) + J. c Columns J,J-1 and J-2 of W are stored again in the WORK array. c This is done to reduce virtual memory swaps. 300 vst((n-1)*(i-1)+j) = vij wst((n-1)*(i-1)+j) = wij work(i,mod(j,3)) = wij if (j.gt.n) then c VMIN is the minimum folding energy of the entire sequence. c vmin = min0(vmin,vst((n-1)*(i-1)+j)+vst((n-1)*(j-n-1)+i)) vmin = min(vmin,vst((n-1)*(i-1)+j)+vst((n-1)*(j-n-1)+i)) endif enddo if (j.ge.n) then do k = j+1,n+1,-1 c Fill in some WORK array values before beginning work on the c next column. work(k,mod(j+1,3)) = wst((k-n-1)*(n-1)+j+1-n) enddo endif enddo return end c Used to recall values of V which are actually stored in VST. function v(i,j) include 'rfd.inc' if (i.gt.n) then v = vst((n-1)*(i-n-1)+j-n) else v = vst((n-1)*(i-1)+j) endif return end c Used to recall values of W which are actually stored in WST. function w(i,j) include 'rfd.inc' if (i.gt.n) then w = wst((n-1)*(i-n-1)+j-n) else w = wst((n-1)*(i-1)+j) endif return end c Computes an optimal structure on the subsequence II to JI where c II and JI must base-pair with one another. ERROR = 0 is normal c termination. c NFORCE is the number of forced base-pairs encountered in the traceback. subroutine trace(ii,ji,nforce,error) include 'rfd.inc' logical fce error = 0 c Zero the appropriate region of BASEPR. if (ji.le.n) then do k=ii,ji basepr(k) = 0 enddo else do k=1,ji-n basepr(k) = 0 enddo do k = ii,n basepr(k) = 0 enddo endif c Initialize the stack of outstanding base-pairs and push c II, JI and V(II,JI) on to the stack. The fourth stack position c is unused in this subroutine. call initst call push(ii,ji,v(ii,ji),0) nforce = 0 c Pull a fragment and its expected energy from the stack. c End if there are no fragments left. 100 stz = pull(i,j,e,xx) if (stz.ne.0) return c Do I and J base-pair with one another? if (e.eq.v(i,j)) goto 300 tst = w(i+1,j) + eparam(6) do while (e.eq.tst) c Whittle away from the 5' end. i = i + 1 if (i.ge.j) goto 100 e = w(i,j) tst = w(i+1,j) + eparam(6) enddo tst = w(i,j-1) + eparam(6) do while (e.eq.tst) c Whittle away from the 3' end. j = j - 1 if (i.ge.j) goto 100 e = w(i,j) tst = w(i,j-1) + eparam(6) enddo tst1 = v(i+1,j) + eparam(6) + eparam(10) + . dangle(numseq(j),numseq(i+1),numseq(i),2) tst2 = v(i,j-1) + eparam(6) + eparam(10) + . dangle(numseq(j-1),numseq(i),numseq(j),1) tst3 = v(i+1,j-1) + 2*eparam(6) + eparam(10) + . dangle(numseq(j-1),numseq(i+1),numseq(i),2) . + dangle(numseq(j-1),numseq(i+1),numseq(j),1) if (e.eq.tst1) then c I dangles over I+1,J. i = i + 1 e = v(i,j) else if (e.eq.tst2) then c J dangles over I,J-1. j = j - 1 e = v(i,j) else if (e.eq.tst3) then c Both I and J dangle over I+1,J-1. i = i + 1 j = j - 1 e = v(i,j) endif c Check for stem closing a multi-loop. if (e.eq.v(i,j)+eparam(10)) e = v(i,j) if (e.ne.v(i,j)) then c Cannot chop away at ends any more and still the ends do not c base-pair with one another. Structure MUST bifurcate (OPEN). k = i+1 200 if (k.eq.j) then c Structure will not split. Error ii = hstnum(i) ji = hstnum(j) error = 10 return endif if (e.eq.w(i,k) + w(k+1,j)) then c Best structure on I,J splits into best structures on I,K and c K+1,J. Push these fragments on to the stack. call push(i,k,w(i,k),0) call push(k+1,j,w(k+1,j),0) goto 100 else k = k + 1 goto 200 endif endif c Base-pair found. Base-pairs are stored in the range 1 <= I < J <= N. 300 if (j.le.n) then basepr(i) = j basepr(j) = i else if (i.gt.n) then basepr(i-n) = j-n basepr(j-n) = i-n i = i - n j = j - n else basepr(j-n) = i basepr(i) = j-n endif c Check if this is a forced base-pair. if (force(i).eq.2.or.force(j).eq.2.or.fce(i,j)) . nforce = nforce + 1 if (force(i).eq.2.and.force(j).eq.2) nforce = nforce + 1 c Perhaps I,J stacks over I+1,J-1? if (e.eq.erg(2,i,j,i+1,j-1) . + v(i+1,j-1)) then i = i + 1 j = j - 1 e = v(i,j) goto 300 endif c Perhaps I,J closes a hairpin loop? if (e.eq.erg(4,i,j,i,j)) goto 100 c Define E' ( EP in the program ) to be E corrected by a c possible bonus energy for forced base-pairing. c ep = e if (force(i).eq.2.or.force(j).eq.2.or.fce(i,j)) . ep = ep - eparam(9) if (force(i).eq.2.and.force(j).eq.2) ep = ep - eparam(9) k = i+2 c Perhaps I,J closes a multi-loop? 400 if (k.ge.j-3) goto 500 if (ep.eq.w(i+1,k) + w(k+1,j-1) + eparam(10) + eparam(5)) then c Multi-loop. No dangling ends on I,J. call push(i+1,k,w(i+1,k),0) call push(k+1,j-1,w(k+1,j-1),0) goto 100 else if (ep.eq.erg(6,i,j,i+1,1)+w(i+2,k)+w(k+1,j-1)+eparam(10)+ . eparam(6)+eparam(5)) then c Multi-loop. I+1 dangles over I,J base-pair. call push(i+2,k,w(i+2,k),0) call push(k+1,j-1,w(k+1,j-1),0) goto 100 else if (ep.eq.erg(6,i,j,j-1,2)+w(i+1,k)+w(k+1,j-2)+eparam(10)+ . eparam(6)+eparam(5)) then c Multi-loop. J-1 dangles over I,J base-pair. call push(i+1,k,w(i+1,k),0) call push(k+1,j-2,w(k+1,j-2),0) goto 100 else if (ep.eq.erg(6,i,j,i+1,1)+erg(6,i,j,j-1,2)+w(i+2,k) . +w(k+1,j-2)+ eparam(10)+2*eparam(6)+eparam(5)) then c Multi-loop. Both I+1 and J-1 dangle over the I,J base-pair. call push(i+2,k,w(i+2,k),0) call push(k+1,j-2,w(k+1,j-2),0) goto 100 else k = k + 1 goto 400 endif c None of the above work. I,J MUST close a bulge or interior loop. 500 do d = j-i-3,1,-1 do ip = i+1,j-1-d jp = d+ip if (j-i-2-d.gt.eparam(7)) then c Error, bulge or interior loop not found. ii = hstnum(i) ji = hstnum(j) error = 11 return endif if (abs(ip-i+jp-j).le.eparam(8)) then if (e.eq.erg(3,i,j,ip,jp)+v(ip,jp)) then i = ip j = jp e = v(i,j) goto 300 endif endif enddo enddo c Error, bulge or interior loop not found. ii = hstnum(i) ji = hstnum(j) error = 11 return end c Store results of a SAVE run for a CONTINUATION run. subroutine putcont include 'rfd.inc' write(30) n,nsave,vmin,listsz,seqlab write(30) stack,tstk,dangle,hairpin,bulge,inter,eparam write(30) (vst(i),i=1,n*n) write(30) (wst(i),i=1,n*n) write(30) (seq(i),i=nsave(1),nsave(2)) write(30) ((list(i,j),i=1,100),j=1,4) write(30) tloop,numoftloops write(30) (poppen(i),i=1,4),maxpen,prelog return end c Read results of a SAVE run for a CONTINUATION run. subroutine getcont include 'rfd.inc' read(30,end=10) n,nsave,vmin,listsz,seqlab read(30,end=10) stack,tstk,dangle,hairpin,bulge,inter,eparam read(30,end=10) (vst(i),i=1,n*n) read(30,end=10) (wst(i),i=1,n*n) read(30,end=10) (seq(i),i=nsave(1),nsave(2)) read(30,end=10) ((list(i,j),i=1,100),j=1,4) read(30,err=10) tloop,numoftloops read(30,err=10) (poppen(i),i=1,4),maxpen,prelog goto 11 10 call errmsg(40,0,0) 11 return end