diff --git a/biology/py-crossmap/Makefile b/biology/py-crossmap/Makefile
index a5a3746a31c4..ddee1a5a1fa7 100644
--- a/biology/py-crossmap/Makefile
+++ b/biology/py-crossmap/Makefile
@@ -1,26 +1,24 @@
 PORTNAME=	crossmap
-DISTVERSION=	0.5.4
-PORTREVISION=	1
+DISTVERSION=	0.7.3
 CATEGORIES=	biology python
 MASTER_SITES=	PYPI
 PKGNAMEPREFIX=	${PYTHON_PKGNAMEPREFIX}
-DISTNAME=	CrossMap-${DISTVERSION}
 
 MAINTAINER=	jwb@FreeBSD.org
 COMMENT=	Lift over genomics coordinates between assemblies
-WWW=		https://pypi.python.org/pypi/crossmap
+WWW=		https://github.com/liguowang/CrossMap
 
-LICENSE=	GPLv2
+LICENSE=	GPLv3+
 LICENSE_FILE=	${WRKSRC}/LICENSE.txt
 
 BUILD_DEPENDS=	${PYTHON_PKGNAMEPREFIX}nose>0.10.4:devel/py-nose@${PY_FLAVOR}
 RUN_DEPENDS=	${PYTHON_PKGNAMEPREFIX}pysam>0:biology/py-pysam@${PY_FLAVOR} \
 		${PYTHON_PKGNAMEPREFIX}bx-python>0:biology/py-bx-python@${PY_FLAVOR} \
 		${PYTHON_PKGNAMEPREFIX}pyBigWig>0:biology/py-pybigwig@${PY_FLAVOR}
 
 USES=		python
 USE_PYTHON=	autoplist concurrent cython distutils
 
 NO_ARCH=	yes
 
 .include <bsd.port.mk>
diff --git a/biology/py-crossmap/distinfo b/biology/py-crossmap/distinfo
index 1dabfc731aef..f35df2d53427 100644
--- a/biology/py-crossmap/distinfo
+++ b/biology/py-crossmap/distinfo
@@ -1,3 +1,3 @@
-TIMESTAMP = 1618936542
-SHA256 (CrossMap-0.5.4.tar.gz) = 3419a5bf422754c3acb1e59ec9bba1a6c9a19d3673e962ae832e429ef0f768e5
-SIZE (CrossMap-0.5.4.tar.gz) = 9511082
+TIMESTAMP = 1740057259
+SHA256 (crossmap-0.7.3.tar.gz) = c5793d1bbfea962b3f21d8cd9830a79a169b3a3ec6461555d819be125b391f6d
+SIZE (crossmap-0.7.3.tar.gz) = 33325
diff --git a/biology/py-crossmap/files/patch-2to3 b/biology/py-crossmap/files/patch-2to3
deleted file mode 100644
index c3b680224b43..000000000000
--- a/biology/py-crossmap/files/patch-2to3
+++ /dev/null
@@ -1,2955 +0,0 @@
---- lib/cmmodule/SAM.py.orig	2018-12-17 16:05:26 UTC
-+++ lib/cmmodule/SAM.py
-@@ -150,52 +150,52 @@ class ParseSAM:
- 					forward_SE +=1
- 				
- 		if paired:				
--			print >>sys.stderr,"\n#=================================================="
--			print >>sys.stderr,"#================Report (pair-end)================="
--			print >>sys.stderr, "%-25s%d" % ("Total Reads:",total_read)
--			print >>sys.stderr, "%-25s%d" % ("Total Mapped Reads:", (mapped_read1 + mapped_read2))
--			print >>sys.stderr, "%-25s%d" % ("Total Unmapped Reads:",(unmapped_read1 + unmapped_read2))
--			print >>sys.stderr, "%-25s%d" % ("PCR duplicate:",pcr_duplicate)
--			print >>sys.stderr, "%-25s%d" % ("QC-failed:",low_qual)
--			print >>sys.stderr, "%-25s%d" % ("Not primary mapping:",secondary_hit)
--			print >>sys.stderr, "\n",
--			print >>sys.stderr, "%-25s%d" % ("Unmapped Read-1:",unmapped_read1)
--			print >>sys.stderr, "%-25s%d" % ("Mapped Read-1:",mapped_read1)
--			print >>sys.stderr, "%-25s%d" % ("  Forward (+):",forward_read1)
--			print >>sys.stderr, "%-25s%d" % ("  Reverse (-):",reverse_read1)
-+			print("\n#==================================================", file=sys.stderr)
-+			print("#================Report (pair-end)=================", file=sys.stderr)
-+			print("%-25s%d" % ("Total Reads:",total_read), file=sys.stderr)
-+			print("%-25s%d" % ("Total Mapped Reads:", (mapped_read1 + mapped_read2)), file=sys.stderr)
-+			print("%-25s%d" % ("Total Unmapped Reads:",(unmapped_read1 + unmapped_read2)), file=sys.stderr)
-+			print("%-25s%d" % ("PCR duplicate:",pcr_duplicate), file=sys.stderr)
-+			print("%-25s%d" % ("QC-failed:",low_qual), file=sys.stderr)
-+			print("%-25s%d" % ("Not primary mapping:",secondary_hit), file=sys.stderr)
-+			print("\n", end=' ', file=sys.stderr)
-+			print("%-25s%d" % ("Unmapped Read-1:",unmapped_read1), file=sys.stderr)
-+			print("%-25s%d" % ("Mapped Read-1:",mapped_read1), file=sys.stderr)
-+			print("%-25s%d" % ("  Forward (+):",forward_read1), file=sys.stderr)
-+			print("%-25s%d" % ("  Reverse (-):",reverse_read1), file=sys.stderr)
- 			
--			print >>sys.stderr, "\n",
--			print >>sys.stderr, "%-25s%d" % ("Unmapped Read-2:",unmapped_read2)
--			print >>sys.stderr, "%-25s%d" % ("Mapped Read-2:",mapped_read2)
--			print >>sys.stderr, "%-25s%d" % ("  Forward (+):",forward_read2)
--			print >>sys.stderr, "%-25s%d" % ("  Reverse (-):",reverse_read2)
-+			print("\n", end=' ', file=sys.stderr)
-+			print("%-25s%d" % ("Unmapped Read-2:",unmapped_read2), file=sys.stderr)
-+			print("%-25s%d" % ("Mapped Read-2:",mapped_read2), file=sys.stderr)
-+			print("%-25s%d" % ("  Forward (+):",forward_read2), file=sys.stderr)
-+			print("%-25s%d" % ("  Reverse (-):",reverse_read2), file=sys.stderr)
- 			
--			print >>sys.stderr, "\n",
--			print >>sys.stderr, "%-25s%d" % ("Mapped to (+/-):",plus_minus)
--			print >>sys.stderr, "%-25s%d" % ("Mapped to (-/+):",minus_plus)
--			print >>sys.stderr, "%-25s%d" % ("Mapped to (+/+):",plus_plus)
--			print >>sys.stderr, "%-25s%d" % ("Mapped to (-/-):",minus_minus)
--			print >>sys.stderr, "\n",
--			print >>sys.stderr, "%-25s%d" % ("Spliced Hits:",_numSplitHit)
--			print >>sys.stderr, "%-25s%d" % ("Non-spliced Hits:",_numMonoHit)
--			print >>sys.stderr, "%-25s%d" % ("Reads have insertion:",_numInsertion)
--			print >>sys.stderr, "%-25s%d" % ("Reads have deletion:",_numDeletion)
-+			print("\n", end=' ', file=sys.stderr)
-+			print("%-25s%d" % ("Mapped to (+/-):",plus_minus), file=sys.stderr)
-+			print("%-25s%d" % ("Mapped to (-/+):",minus_plus), file=sys.stderr)
-+			print("%-25s%d" % ("Mapped to (+/+):",plus_plus), file=sys.stderr)
-+			print("%-25s%d" % ("Mapped to (-/-):",minus_minus), file=sys.stderr)
-+			print("\n", end=' ', file=sys.stderr)
-+			print("%-25s%d" % ("Spliced Hits:",_numSplitHit), file=sys.stderr)
-+			print("%-25s%d" % ("Non-spliced Hits:",_numMonoHit), file=sys.stderr)
-+			print("%-25s%d" % ("Reads have insertion:",_numInsertion), file=sys.stderr)
-+			print("%-25s%d" % ("Reads have deletion:",_numDeletion), file=sys.stderr)
- 		else:
--			print >>sys.stderr,"\n#===================================================="
--			print >>sys.stderr,"#================Report (single-end)================="
--			print >>sys.stderr, "%-25s%d" % ("Total Reads:",total_read)
--			print >>sys.stderr, "%-25s%d" % ("Total Mapped Reads:", map_SE)
--			print >>sys.stderr, "%-25s%d" % ("Total Unmapped Reads:",unmap_SE)
--			print >>sys.stderr, "%-25s%d" % ("PCR duplicate:",pcr_duplicate)
--			print >>sys.stderr, "%-25s%d" % ("QC-failed:",low_qual)
--			print >>sys.stderr, "%-25s%d" % ("Not primary mapping:",secondary_hit)
--			print >>sys.stderr, "%-25s%d" % ("froward (+):",forward_SE)
--			print >>sys.stderr, "%-25s%d" % ("reverse (-):",reverse_SE)
--			print >>sys.stderr, "\n",
--			print >>sys.stderr, "%-25s%d" % ("Spliced Hits:",_numSplitHit)
--			print >>sys.stderr, "%-25s%d" % ("Non-spliced Hits:",_numMonoHit)
--			print >>sys.stderr, "%-25s%d" % ("Reads have insertion:",_numInsertion)
--			print >>sys.stderr, "%-25s%d" % ("Reads have deletion:",_numDeletion)			
-+			print("\n#====================================================", file=sys.stderr)
-+			print("#================Report (single-end)=================", file=sys.stderr)
-+			print("%-25s%d" % ("Total Reads:",total_read), file=sys.stderr)
-+			print("%-25s%d" % ("Total Mapped Reads:", map_SE), file=sys.stderr)
-+			print("%-25s%d" % ("Total Unmapped Reads:",unmap_SE), file=sys.stderr)
-+			print("%-25s%d" % ("PCR duplicate:",pcr_duplicate), file=sys.stderr)
-+			print("%-25s%d" % ("QC-failed:",low_qual), file=sys.stderr)
-+			print("%-25s%d" % ("Not primary mapping:",secondary_hit), file=sys.stderr)
-+			print("%-25s%d" % ("froward (+):",forward_SE), file=sys.stderr)
-+			print("%-25s%d" % ("reverse (-):",reverse_SE), file=sys.stderr)
-+			print("\n", end=' ', file=sys.stderr)
-+			print("%-25s%d" % ("Spliced Hits:",_numSplitHit), file=sys.stderr)
-+			print("%-25s%d" % ("Non-spliced Hits:",_numMonoHit), file=sys.stderr)
-+			print("%-25s%d" % ("Reads have insertion:",_numInsertion), file=sys.stderr)
-+			print("%-25s%d" % ("Reads have deletion:",_numDeletion), file=sys.stderr)			
- 			
- 	def samTobed(self,outfile=None,mergePE=False):
- 		"""Convert SAM file to BED file. BED file will be saved as xxx.sam.bed unless otherwise specified.
-@@ -204,7 +204,7 @@ class ParseSAM:
- 		if outfile is None:
- 			outfile=self.fileName + ".bed"
- 
--		print >>sys.stderr,"\tWriting bed entries to\"",outfile,"\"...",
-+		print("\tWriting bed entries to\"",outfile,"\"...", end=' ', file=sys.stderr)
- 		FO=open(outfile,'w')
- 		for line in self.f:
- 			if line.startswith(('@','track')):continue		#skip head lines
-@@ -240,14 +240,14 @@ class ParseSAM:
- 			for i in range(0,len(comb),2):
- 				blockStart.append(str(sum(comb[:i])))
- 			blockStarts = ','.join(blockStart)
--			print >>FO, string.join((str(i) for i in [chrom,chromStart,chromEnd,name,score,strand,thickStart,thickEnd,itemRgb,blockCount,blockSizes,blockStarts]),sep="\t")			
--		print >>sys.stderr, "Done"
-+			print(string.join((str(i) for i in [chrom,chromStart,chromEnd,name,score,strand,thickStart,thickEnd,itemRgb,blockCount,blockSizes,blockStarts]),sep="\t"), file=FO)			
-+		print("Done", file=sys.stderr)
- 		FO.close()
- 		self.f.seek(0)
- 
- 		if mergePE:
- 		#creat another bed file. pair-end reads will be merged into single bed entry
--			print >>sys.stderr, "Writing consoidated bed file ...",
-+			print("Writing consoidated bed file ...", end=' ', file=sys.stderr)
- 			bedfile = open(outfile,'r')
- 			outfile_2 = outfile + ".consolidate.bed"
- 			outfile_3 = outfile + '.filter'
-@@ -292,11 +292,11 @@ class ParseSAM:
- 					if(blocks[key] ==1):	#single end, single hit
- 						st = [i - txSt[key] for i in starts[key]]
- 						st = string.join([str(i) for i in st],',')
--						print >>FO, chr[key].pop(),"\t",txSt[key],"\t",txEnd[key],"\t",key,"\t","11\t",strand[key][0],"\t",txSt[key],"\t",txEnd[key],"\t","0,255,0\t",blocks[key],"\t",string.join(sizes[key],','),"\t",st
-+						print(chr[key].pop(),"\t",txSt[key],"\t",txEnd[key],"\t",key,"\t","11\t",strand[key][0],"\t",txSt[key],"\t",txEnd[key],"\t","0,255,0\t",blocks[key],"\t",string.join(sizes[key],','),"\t",st, file=FO)
- 					else:
- 						st = [i - txSt[key] for i in starts[key]]	#single end, spliced hit
- 						st = string.join([str(i) for i in st],',')
--						print >>FO, chr[key].pop(),"\t",txSt[key],"\t",txEnd[key],"\t",key,"\t","12\t",strand[key][0],"\t",txSt[key],"\t",txEnd[key],"\t","0,255,0\t",blocks[key],"\t",string.join(sizes[key],','),"\t",st						
-+						print(chr[key].pop(),"\t",txSt[key],"\t",txEnd[key],"\t",key,"\t","12\t",strand[key][0],"\t",txSt[key],"\t",txEnd[key],"\t","0,255,0\t",blocks[key],"\t",string.join(sizes[key],','),"\t",st, file=FO)						
- 								
- 				elif(count[key]==2):	#pair-end read
- 					direction = string.join(strand[key],'/')	
-@@ -306,17 +306,17 @@ class ParseSAM:
- 					#st=[string.atoi(i) for i in st]
- 					if(len(chr[key])==1):	#pair-end reads mapped to same chromosome
- 						if blocks[key] ==2:	#pair end, single hits
--							print >>FO, chr[key].pop(),"\t",txSt[key],"\t",txEnd[key],"\t",key + "|strand=" + direction + "|chrom=same","\t","21\t",'.',"\t",txSt[key],"\t",txEnd[key],"\t","0,255,0\t",blocks[key],"\t",string.join(sz,','),"\t",string.join([str(i) for i in st],',')
-+							print(chr[key].pop(),"\t",txSt[key],"\t",txEnd[key],"\t",key + "|strand=" + direction + "|chrom=same","\t","21\t",'.',"\t",txSt[key],"\t",txEnd[key],"\t","0,255,0\t",blocks[key],"\t",string.join(sz,','),"\t",string.join([str(i) for i in st],','), file=FO)
- 						elif blocks[key] >2:	#
--							print >>FO, chr[key].pop(),"\t",txSt[key],"\t",txEnd[key],"\t",key + "|strand=" + direction + "|chrom=same","\t","22\t",'.',"\t",txSt[key],"\t",txEnd[key],"\t","0,255,0\t",blocks[key],"\t",string.join(sz,','),"\t",string.join([str(i) for i in st],',')
-+							print(chr[key].pop(),"\t",txSt[key],"\t",txEnd[key],"\t",key + "|strand=" + direction + "|chrom=same","\t","22\t",'.',"\t",txSt[key],"\t",txEnd[key],"\t","0,255,0\t",blocks[key],"\t",string.join(sz,','),"\t",string.join([str(i) for i in st],','), file=FO)
- 					else:
--						print >>FOF,key,"\t","pair-end mapped, but two ends mapped to different chromosome"
-+						print(key,"\t","pair-end mapped, but two ends mapped to different chromosome", file=FOF)
- 				elif(count[key] >2):	#reads occur more than 2 times
--					print >>FOF,key,"\t","occurs more than 2 times in sam file"
-+					print(key,"\t","occurs more than 2 times in sam file", file=FOF)
- 					continue
- 			FO.close()
- 			FOF.close()
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 
- 
- 	def samTowig(self,outfile=None,log2scale=False,header=False,strandSpecific=False):
-@@ -326,7 +326,7 @@ class ParseSAM:
- 		if outfile is None:
- 			outfile = self.fileName + ".wig"
- 		FO=open(outfile,'w')
--		print >>sys.stderr, "Writing wig file to\"",outfile,"\"..."
-+		print("Writing wig file to\"",outfile,"\"...", file=sys.stderr)
- 		
- 		headline="track type=wiggle_0 name=" + outfile + " track_label description='' visibility=full color=255,0,0"
- 		wig=collections.defaultdict(dict)
-@@ -359,24 +359,24 @@ class ParseSAM:
- 			
- 			blocks = cigar.fetch_exon(chrom,txStart,field[5])	
- 			for block in blocks:
--				hits.extend(range(block[1]+1,block[2]+1))
-+				hits.extend(list(range(block[1]+1,block[2]+1)))
- 				
- 			if strandSpecific is not True:
- 				for i in hits:
--					if wig[chrom].has_key(i):
-+					if i in wig[chrom]:
- 						wig[chrom][i] +=1
- 					else:
- 						wig[chrom][i]=1
- 			else:
- 				if strand_rule[read_type + strand] == '-':
- 					for i in hits:
--						if Nwig[chrom].has_key(i):
-+						if i in Nwig[chrom]:
- 							Nwig[chrom][i] += 1
- 						else:
- 							Nwig[chrom][i] = 1
- 				if strand_rule[read_type + strand] == '+':
- 					for i in hits:
--						if Pwig[chrom].has_key(i):
-+						if i in Pwig[chrom]:
- 							Pwig[chrom][i] +=1
- 						else:
- 							Pwig[chrom][i]=1					
-@@ -385,17 +385,17 @@ class ParseSAM:
- 		
- 		if strandSpecific is not True:
- 			for chr in sorted(wig.keys()):
--				print >>sys.stderr, "Writing ",chr, " ..."
-+				print("Writing ",chr, " ...", file=sys.stderr)
- 				FO.write('variableStep chrom='+chr+'\n')
- 				for coord in sorted(wig[chr]):
- 					if log2scale:FO.write("%d\t%5.3f\n" % (coord,math.log(wig[chr][coord],2)))
- 					else:FO.write("%d\t%d\n" % (coord,wig[chr][coord]))
- 		else:
--			chroms=set(Pwig.keys() + Nwig.keys())
-+			chroms=set(list(Pwig.keys()) + list(Nwig.keys()))
- 			for chr in sorted(chroms):
--				print >>sys.stderr, "Writing ",chr, " ..."
-+				print("Writing ",chr, " ...", file=sys.stderr)
- 				FO.write('variableStep chrom='+chr+'\n')
--				coords=sorted(set(Pwig[chr].keys() + Nwig[chr].keys()))
-+				coords=sorted(set(list(Pwig[chr].keys()) + list(Nwig[chr].keys())))
- 				for coord in coords:
- 					if ((coord in Pwig[chr]) and (coord not in Nwig[chr])):
- 						FO.write("%d\t%d\n" % (coord,Pwig[chr][coord]))
-@@ -418,7 +418,7 @@ class ParseSAM:
- 			else: outfile = self.fileName + ".unmap.fa"
- 		FO=open(outfile,'w')
- 		unmapCount=0
--		print >>sys.stderr, "Writing unmapped reads to\"",outfile,"\"... ",
-+		print("Writing unmapped reads to\"",outfile,"\"... ", end=' ', file=sys.stderr)
- 		
- 		for line in self.f:
- 			hits=[]
-@@ -438,7 +438,7 @@ class ParseSAM:
- 				if fastq: FO.write('@' + seqID + '\n' + seq +'\n' + '+' +'\n' + qual+'\n')
- 				else: FO.write('>' + seqID + '\n' + seq +'\n')
- 
--		print >>sys.stderr, str(unmapCount) + " reads saved!\n"
-+		print(str(unmapCount) + " reads saved!\n", file=sys.stderr)
- 		FO.close()
- 		self.f.seek(0)
- 	
-@@ -449,7 +449,7 @@ class ParseSAM:
- 			outfile = self.fileName + ".PP.sam"
- 		FO=open(outfile,'w')
- 		PPcount=0
--		print >>sys.stderr, "Writing proper paired reads to\"",outfile,"\"... ",
-+		print("Writing proper paired reads to\"",outfile,"\"... ", end=' ', file=sys.stderr)
- 		for line in self.f:
- 			hits=[]
- 			if line[0] == '@':continue						#skip head lines	
-@@ -460,7 +460,7 @@ class ParseSAM:
- 				PPcount +=1
- 				FO.write(line)
- 		FO.close()
--		print >>sys.stderr, str(PPcount) + " reads were saved!\n",
-+		print(str(PPcount) + " reads were saved!\n", end=' ', file=sys.stderr)
- 		self.f.seek(0)
- 
- 	def samNVC(self,outfile=None):
-@@ -481,7 +481,7 @@ class ParseSAM:
- 		c_count=[]
- 		g_count=[]
- 		t_count=[]
--		print >>sys.stderr, "reading sam file ... "
-+		print("reading sam file ... ", file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith('@'):continue									#skip head lines	
- 			if ParseSAM._reExpr2.match(line):continue					#skip blank lines
-@@ -492,44 +492,44 @@ class ParseSAM:
- 				RNA_read = field[9].upper()
- 			else:
- 				RNA_read = field[9].upper().translate(transtab)[::-1]
--			for i in xrange(len(RNA_read)):
-+			for i in range(len(RNA_read)):
- 				key = str(i) + RNA_read[i]
- 				base_freq[key] += 1
- 		
--		print >>sys.stderr, "generating data matrix ..."
--		print >>FO, "Position\tA\tC\tG\tT\tN\tX"
--		for i in xrange(len(RNA_read)):
--			print  >>FO, str(i) + '\t',
--			print  >>FO, str(base_freq[str(i) + "A"]) + '\t',
-+		print("generating data matrix ...", file=sys.stderr)
-+		print("Position\tA\tC\tG\tT\tN\tX", file=FO)
-+		for i in range(len(RNA_read)):
-+			print(str(i) + '\t', end=' ', file=FO)
-+			print(str(base_freq[str(i) + "A"]) + '\t', end=' ', file=FO)
- 			a_count.append(str(base_freq[str(i) + "A"]))
--			print  >>FO, str(base_freq[str(i) + "C"]) + '\t',
-+			print(str(base_freq[str(i) + "C"]) + '\t', end=' ', file=FO)
- 			c_count.append(str(base_freq[str(i) + "C"]))
--			print  >>FO, str(base_freq[str(i) + "G"]) + '\t',
-+			print(str(base_freq[str(i) + "G"]) + '\t', end=' ', file=FO)
- 			g_count.append(str(base_freq[str(i) + "G"]))
--			print  >>FO, str(base_freq[str(i) + "T"]) + '\t',
-+			print(str(base_freq[str(i) + "T"]) + '\t', end=' ', file=FO)
- 			t_count.append(str(base_freq[str(i) + "T"]))
--			print  >>FO, str(base_freq[str(i) + "N"]) + '\t',
--			print  >>FO, str(base_freq[str(i) + "X"]) + '\t'
-+			print(str(base_freq[str(i) + "N"]) + '\t', end=' ', file=FO)
-+			print(str(base_freq[str(i) + "X"]) + '\t', file=FO)
- 		FO.close()
- 		
- 		#generating R scripts
--		print >>sys.stderr, "generating R script  ..."
--		print >>RS, "position=c(" + ','.join([str(i) for i in xrange(len(RNA_read))]) + ')'
--		print >>RS, "A_count=c(" + ','.join(a_count) + ')'
--		print >>RS, "C_count=c(" + ','.join(c_count) + ')'
--		print >>RS, "G_count=c(" + ','.join(g_count) + ')'
--		print >>RS, "T_count=c(" + ','.join(t_count) + ')'
--		print >>RS, "total= A_count + C_count + G_count + T_count"
--		print >>RS, "ym=max(A_count/total,C_count/total,G_count/total,T_count/total) + 0.05"
--		print >>RS, "yn=min(A_count/total,C_count/total,G_count/total,T_count/total)"
-+		print("generating R script  ...", file=sys.stderr)
-+		print("position=c(" + ','.join([str(i) for i in range(len(RNA_read))]) + ')', file=RS)
-+		print("A_count=c(" + ','.join(a_count) + ')', file=RS)
-+		print("C_count=c(" + ','.join(c_count) + ')', file=RS)
-+		print("G_count=c(" + ','.join(g_count) + ')', file=RS)
-+		print("T_count=c(" + ','.join(t_count) + ')', file=RS)
-+		print("total= A_count + C_count + G_count + T_count", file=RS)
-+		print("ym=max(A_count/total,C_count/total,G_count/total,T_count/total) + 0.05", file=RS)
-+		print("yn=min(A_count/total,C_count/total,G_count/total,T_count/total)", file=RS)
- 		
--		print >>RS, 'pdf("NVC_plot.pdf")'
--		print >>RS, 'plot(position,A_count/total,type="o",pch=20,ylim=c(yn,ym),col="dark green",xlab="Position of Read",ylab="Nucleotide Frequency")'
--		print >>RS, 'lines(position,T_count/total,type="o",pch=20,col="red")'
--		print >>RS, 'lines(position,G_count/total,type="o",pch=20,col="blue")'
--		print >>RS, 'lines(position,C_count/total,type="o",pch=20,col="cyan")'
--		print >>RS, 'legend('+ str(len(RNA_read)-10) + ',ym,legend=c("A","T","G","C"),col=c("dark green","red","blue","cyan"),lwd=2,pch=20,text.col=c("dark green","red","blue","cyan"))'
--		print >>RS, "dev.off()"
-+		print('pdf("NVC_plot.pdf")', file=RS)
-+		print('plot(position,A_count/total,type="o",pch=20,ylim=c(yn,ym),col="dark green",xlab="Position of Read",ylab="Nucleotide Frequency")', file=RS)
-+		print('lines(position,T_count/total,type="o",pch=20,col="red")', file=RS)
-+		print('lines(position,G_count/total,type="o",pch=20,col="blue")', file=RS)
-+		print('lines(position,C_count/total,type="o",pch=20,col="cyan")', file=RS)
-+		print('legend('+ str(len(RNA_read)-10) + ',ym,legend=c("A","T","G","C"),col=c("dark green","red","blue","cyan"),lwd=2,pch=20,text.col=c("dark green","red","blue","cyan"))', file=RS)
-+		print("dev.off()", file=RS)
- 		
- 		RS.close()
- 		#self.f.seek(0)
-@@ -546,7 +546,7 @@ class ParseSAM:
- 		RS=open(outfile2,'w')
- 		
- 		gc_hist=collections.defaultdict(int)	#key is GC percent, value is count of reads
--		print >>sys.stderr, "reading sam file ... "
-+		print("reading sam file ... ", file=sys.stderr)
- 		for line in self.f:
- 			if line[0] == '@':continue						#skip head lines	
- 			if ParseSAM._reExpr2.match(line):continue		#skip blank lines
-@@ -556,18 +556,18 @@ class ParseSAM:
- 			#print gc_percent
- 			gc_hist[gc_percent] += 1
- 		
--		print >>sys.stderr, "writing GC content ..."
-+		print("writing GC content ...", file=sys.stderr)
- 		
--		print >>FO, "GC%\tread_count"
--		for i in gc_hist.keys():
--			print >>FO, i + '\t' + str(gc_hist[i])
-+		print("GC%\tread_count", file=FO)
-+		for i in list(gc_hist.keys()):
-+			print(i + '\t' + str(gc_hist[i]), file=FO)
- 			
--		print >>sys.stderr, "writing R script ..."
--		print >>RS, "pdf('GC_content.pdf')"
--		print >>RS, 'gc=rep(c(' + ','.join([i for i in gc_hist.keys()]) + '),' + 'times=c(' + ','.join([str(i) for i in gc_hist.values()]) + '))'
--		print >>RS, 'hist(gc,probability=T,breaks=%d,xlab="GC content (%%)",ylab="Density of Reads",border="blue",main="")' % 100
-+		print("writing R script ...", file=sys.stderr)
-+		print("pdf('GC_content.pdf')", file=RS)
-+		print('gc=rep(c(' + ','.join([i for i in list(gc_hist.keys())]) + '),' + 'times=c(' + ','.join([str(i) for i in list(gc_hist.values())]) + '))', file=RS)
-+		print('hist(gc,probability=T,breaks=%d,xlab="GC content (%%)",ylab="Density of Reads",border="blue",main="")' % 100, file=RS)
- 		#print >>RS, "lines(density(gc),col='red')"
--		print >>RS ,"dev.off()"		
-+		print("dev.off()", file=RS)		
- 		#self.f.seek(0)
- 		
- 	def samDupRate(self,outfile=None,up_bound=500):
-@@ -589,7 +589,7 @@ class ParseSAM:
- 		
- 		seqDup_count=collections.defaultdict(int)
- 		posDup_count=collections.defaultdict(int)
--		print >>sys.stderr, "reading sam file ... "
-+		print("reading sam file ... ", file=sys.stderr)
- 		for line in self.f:
- 			if line[0] == '@':continue						#skip head lines	
- 			if ParseSAM._reExpr2.match(line):continue		#skip blank lines
-@@ -616,37 +616,37 @@ class ParseSAM:
- 			coord = chrom + ":" + str(chromStart) + "-" + str(chromEnd) + ":" + blockSizes + ":" + blockStarts
- 			posDup[coord] +=1
- 			
--		print >>sys.stderr, "report duplicte rate based on sequence ..."
--		print >>SEQ, "Occurrence\tUniqReadNumber"
--		for i in seqDup.values():			#key is occurence, value is uniq reads number (based on seq)
-+		print("report duplicte rate based on sequence ...", file=sys.stderr)
-+		print("Occurrence\tUniqReadNumber", file=SEQ)
-+		for i in list(seqDup.values()):			#key is occurence, value is uniq reads number (based on seq)
- 			seqDup_count[i] +=1
--		for k in sorted(seqDup_count.iterkeys()):	
--			print >>SEQ, str(k) +'\t'+ str(seqDup_count[k])
-+		for k in sorted(seqDup_count.keys()):	
-+			print(str(k) +'\t'+ str(seqDup_count[k]), file=SEQ)
- 		SEQ.close()
- 		
--		print >>sys.stderr, "report duplicte rate based on mapping  ..."
--		print >>POS, "Occurrence\tUniqReadNumber"
--		for i in posDup.values():			#key is occurence, value is uniq reads number (based on coord)
-+		print("report duplicte rate based on mapping  ...", file=sys.stderr)
-+		print("Occurrence\tUniqReadNumber", file=POS)
-+		for i in list(posDup.values()):			#key is occurence, value is uniq reads number (based on coord)
- 			posDup_count[i] +=1
--		for k in sorted(posDup_count.iterkeys()):	
--			print >>POS, str(k) +'\t'+ str(posDup_count[k])
-+		for k in sorted(posDup_count.keys()):	
-+			print(str(k) +'\t'+ str(posDup_count[k]), file=POS)
- 		POS.close()
- 		
- 		
--		print >>sys.stderr, "generate R script ..."
--		print >>RS, "pdf('duplicateRead.pdf')"
--		print >>RS, "par(mar=c(5,4,4,5),las=0)"
--		print >>RS, "seq_occ=c(" + ','.join([str(i) for i in sorted(seqDup_count.iterkeys()) ]) + ')'
--		print >>RS, "seq_uniqRead=c(" + ','.join([str(seqDup_count[i]) for i in sorted(seqDup_count.iterkeys()) ]) + ')'
--		print >>RS, "pos_occ=c(" + ','.join([str(i) for i in sorted(posDup_count.iterkeys()) ]) + ')'
--		print >>RS, "pos_uniqRead=c(" + ','.join([str(posDup_count[i]) for i in sorted(posDup_count.iterkeys()) ]) + ')'
--		print >>RS, "plot(pos_occ,log10(pos_uniqRead),ylab='Number of Reads (log10)',xlab='Frequency',pch=4,cex=0.8,col='blue',xlim=c(1,%d),yaxt='n')" % up_bound
--		print >>RS, "points(seq_occ,log10(seq_uniqRead),pch=20,cex=0.8,col='red')"
--		print >>RS, 'ym=floor(max(log10(pos_uniqRead)))'
--		print >>RS, "legend(%d,ym,legend=c('Sequence-base','Mapping-base'),col=c('red','blue'),pch=c(4,20))" % max(up_bound-200,1)
--		print >>RS, 'axis(side=2,at=0:ym,labels=0:ym)'
--		print >>RS, 'axis(side=4,at=c(log10(pos_uniqRead[1]),log10(pos_uniqRead[2]),log10(pos_uniqRead[3]),log10(pos_uniqRead[4])), labels=c(round(pos_uniqRead[1]*100/sum(pos_uniqRead)),round(pos_uniqRead[2]*100/sum(pos_uniqRead)),round(pos_uniqRead[3]*100/sum(pos_uniqRead)),round(pos_uniqRead[4]*100/sum(pos_uniqRead))))'
--		print >>RS, 'mtext(4, text = "Reads %", line = 2)'
-+		print("generate R script ...", file=sys.stderr)
-+		print("pdf('duplicateRead.pdf')", file=RS)
-+		print("par(mar=c(5,4,4,5),las=0)", file=RS)
-+		print("seq_occ=c(" + ','.join([str(i) for i in sorted(seqDup_count.keys()) ]) + ')', file=RS)
-+		print("seq_uniqRead=c(" + ','.join([str(seqDup_count[i]) for i in sorted(seqDup_count.keys()) ]) + ')', file=RS)
-+		print("pos_occ=c(" + ','.join([str(i) for i in sorted(posDup_count.keys()) ]) + ')', file=RS)
-+		print("pos_uniqRead=c(" + ','.join([str(posDup_count[i]) for i in sorted(posDup_count.keys()) ]) + ')', file=RS)
-+		print("plot(pos_occ,log10(pos_uniqRead),ylab='Number of Reads (log10)',xlab='Frequency',pch=4,cex=0.8,col='blue',xlim=c(1,%d),yaxt='n')" % up_bound, file=RS)
-+		print("points(seq_occ,log10(seq_uniqRead),pch=20,cex=0.8,col='red')", file=RS)
-+		print('ym=floor(max(log10(pos_uniqRead)))', file=RS)
-+		print("legend(%d,ym,legend=c('Sequence-base','Mapping-base'),col=c('red','blue'),pch=c(4,20))" % max(up_bound-200,1), file=RS)
-+		print('axis(side=2,at=0:ym,labels=0:ym)', file=RS)
-+		print('axis(side=4,at=c(log10(pos_uniqRead[1]),log10(pos_uniqRead[2]),log10(pos_uniqRead[3]),log10(pos_uniqRead[4])), labels=c(round(pos_uniqRead[1]*100/sum(pos_uniqRead)),round(pos_uniqRead[2]*100/sum(pos_uniqRead)),round(pos_uniqRead[3]*100/sum(pos_uniqRead)),round(pos_uniqRead[4]*100/sum(pos_uniqRead))))', file=RS)
-+		print('mtext(4, text = "Reads %", line = 2)', file=RS)
- 		#self.f.seek(0)
- 		
- 	def getUniqMapRead(self,outfile=None):
-@@ -655,7 +655,7 @@ class ParseSAM:
- 			outfile = self.fileName + ".uniq.sam"
- 		FO=open(outfile,'w')
- 		Uniqcount=0
--		print >>sys.stderr, "Writing uniquely mapped reads to\"",outfile,"\"... ",
-+		print("Writing uniquely mapped reads to\"",outfile,"\"... ", end=' ', file=sys.stderr)
- 		for line in self.f:
- 			hits=[]
- 			if line[0] == '@':continue						#skip head lines	
-@@ -667,11 +667,11 @@ class ParseSAM:
- 			#else:
- 				#print >>sys.stderr,line,
- 			if (ParseSAM._uniqueHit_pat.search(line)):
--				print >>sys.stderr,line,
-+				print(line, end=' ', file=sys.stderr)
- 				Uniqcount +=1
- 				FO.write(line)
- 		FO.close()
--		print >>sys.stderr, str(Uniqcount) + " reads were saved!\n",
-+		print(str(Uniqcount) + " reads were saved!\n", end=' ', file=sys.stderr)
- 		self.f.seek(0)
- 
- 	def getWrongStrand(self,outfile=None):
-@@ -680,7 +680,7 @@ class ParseSAM:
- 			outfile = self.fileName + ".wrongStrand.sam"
- 		FO=open(outfile,'w')
- 		wrongStrand=0
--		print >>sys.stderr, "Writing incorrectly stranded reads to\"",outfile,"\"... ",
-+		print("Writing incorrectly stranded reads to\"",outfile,"\"... ", end=' ', file=sys.stderr)
- 		for line in self.f:
- 			hits=[]
- 			if line.startswith('@'):continue						#skip head lines	
-@@ -701,7 +701,7 @@ class ParseSAM:
- 				wrongStrand+=1
- 
- 		FO.close()
--		print >>sys.stderr, str(wrongStrand) + " reads were saved!\n",
-+		print(str(wrongStrand) + " reads were saved!\n", end=' ', file=sys.stderr)
- 		self.f.seek(0)
- 		
- 	def filterSpliceRead(self,outfile=None,min_overhang=8,min_gap=50,max_gap=1000000):
-@@ -714,7 +714,7 @@ class ParseSAM:
- 			outfile = self.fileName + ".SR.sam"
- 			#outfile2 = self.fileName + ".SR.filter.sam"			
- 		splice_sites=collections.defaultdict(set)
--		print >>sys.stderr, "\tDetermine splice sites with proper overhang, intron size ... ",
-+		print("\tDetermine splice sites with proper overhang, intron size ... ", end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line[0] == '@':continue						#skip head lines	
- 			if ParseSAM._reExpr2.match(line):continue		#skip blank lines
-@@ -741,12 +741,12 @@ class ParseSAM:
- 					if (comb[2] >= min_overhang):
- 						splice_sites[chrom].add(map_st + comb[0] + comb[1])			
- 		self.f.seek(0)	
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
- 		
- 		FO=open(outfile,'w')
- 		#FO2=open(outfile2,'w')
--		print >>sys.stderr, "\tExtracting splicing reads  ... ",
-+		print("\tExtracting splicing reads  ... ", end=' ', file=sys.stderr)
- 		total_SR =0
- 		extract_SR =0
- 		total_read =0
-@@ -778,10 +778,10 @@ class ParseSAM:
- 				else:
- 					#FO2.write(line)
- 					continue
--		print >>sys.stderr, "Done"
--		print >>sys.stderr, "\tTotal mapped Read: " + str(total_read)
--		print >>sys.stderr, "\tTotal Splicing Read: " + str(total_SR)
--		print >>sys.stderr, "\Usable Splicing Read: " + str(extract_SR)
-+		print("Done", file=sys.stderr)
-+		print("\tTotal mapped Read: " + str(total_read), file=sys.stderr)
-+		print("\tTotal Splicing Read: " + str(total_SR), file=sys.stderr)
-+		print("\\Usable Splicing Read: " + str(extract_SR), file=sys.stderr)
- 		FO.close()
- 		#FO2.close()
- 		self.f.seek(0)	
-@@ -792,7 +792,7 @@ class ParseSAM:
- 		if outfile is None:
- 			outfile = self.fileName + ".SR.sam"
- 		FO=open(outfile,'w')
--		print >>sys.stderr, "\tExtract splicing reads without any filter ...",
-+		print("\tExtract splicing reads without any filter ...", end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line[0] == '@':continue						#skip head lines	
- 			if ParseSAM._reExpr2.match(line):continue		#skip blank lines
-@@ -803,7 +803,7 @@ class ParseSAM:
- 			if (len(comb)>=3):
- 				FO.write(line)
- 		
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		self.f.seek(0)	
- 		FO.close()
- 
-@@ -812,7 +812,7 @@ class ParseSAM:
- 		The original SAM file must be sorted before hand. if not, using linux command like "sort -k3,3 -k4,4n myfile.sam >myfile.sorted.sam" '''
- 		if outfile is None:
- 			outfile = self.fileName + ".collapsed.sam"
--		print >>sys.stderr, "Writing collapsed SAM file to\"",outfile,"\"... "
-+		print("Writing collapsed SAM file to\"",outfile,"\"... ", file=sys.stderr)
- 		FO=open(outfile,'w')		
- 		flag=""
- 		for line in self.f:
-@@ -840,7 +840,7 @@ class ParseSAM:
- 		else:
- 			outfile = outfile + ".qual.plot.r"
- 		FO=open(outfile,'w')
--		print >>sys.stderr, "\tcalculating quality score ... "
-+		print("\tcalculating quality score ... ", file=sys.stderr)
- 		qual_min={}
- 		qual_max={}
- 		qual_sum={}
-@@ -875,16 +875,16 @@ class ParseSAM:
- 		max_qualities =[str(qual_max[i]) for i in range(0,read_len)]
- 		avg_qualities = [str(qual_sum[i]/total_read) for i in range(0,read_len)]
- 		nt_pos = [str(i) for i in range(0,read_len)]
--		print >>FO, "nt_pos=c(" + ','.join(nt_pos)  + ')'
--		print >>FO, "max_qual=c(" + ','.join(max_qualities)  + ')'
--		print >>FO, "min_qual=c(" + ','.join(min_qualities)  + ')'
--		print >>FO, "avg_qual=c(" + ','.join(avg_qualities)  + ')'
--		print >>FO, "pdf('phred_qual.pdf')"
--		print >>FO, "plot(nt_pos,avg_qual, xlab=\"Nucleotide Position (5'->3')\", ylab='Phred Quality',ylim=c(0,97),lwd=2,type='s')"
--		print >>FO, 'lines(nt_pos,max_qual,type="s",lwd=2,col="red")'
--		print >>FO, 'lines(nt_pos,min_qual,type="s",lwd=2,col="blue")'
--		print >>FO, 'legend(0,100,legend=c("Max","Average","Min"),col=c("red","black","blue"),lwd=2)'
--		print >>FO, 'dev.off()'
-+		print("nt_pos=c(" + ','.join(nt_pos)  + ')', file=FO)
-+		print("max_qual=c(" + ','.join(max_qualities)  + ')', file=FO)
-+		print("min_qual=c(" + ','.join(min_qualities)  + ')', file=FO)
-+		print("avg_qual=c(" + ','.join(avg_qualities)  + ')', file=FO)
-+		print("pdf('phred_qual.pdf')", file=FO)
-+		print("plot(nt_pos,avg_qual, xlab=\"Nucleotide Position (5'->3')\", ylab='Phred Quality',ylim=c(0,97),lwd=2,type='s')", file=FO)
-+		print('lines(nt_pos,max_qual,type="s",lwd=2,col="red")', file=FO)
-+		print('lines(nt_pos,min_qual,type="s",lwd=2,col="blue")', file=FO)
-+		print('legend(0,100,legend=c("Max","Average","Min"),col=c("red","black","blue"),lwd=2)', file=FO)
-+		print('dev.off()', file=FO)
- 		#for i in range(0,read_len):
- 		#	print >>sys.stderr, str(i) + '\t' + str(qual_max[i]) + '\t' + str(qual_min[i]) + '\t' + str(qual_sum[i]/total_read)
- 		#self.f.seek(0)
-@@ -918,7 +918,7 @@ class ParseSAM:
- 						scores[chrom][pos] =1
- 					else:
- 						scores[chrom][pos] +=1			
--			if lines % 10000 == 0: print >>sys.stderr, "%i lines loaded \r" % lines
-+			if lines % 10000 == 0: print("%i lines loaded \r" % lines, file=sys.stderr)
- 		return scores
- 		self.f.seek(0)
- 
-@@ -943,7 +943,7 @@ class QCSAM:
- 		The 5th column is number of reads fallen into the region defined by the first 3 columns'''
- 		
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		if outfile is None:
- 			exon_count = self.fileName + "_exon.count.bed"
-@@ -968,7 +968,7 @@ class QCSAM:
- 		splicedReads=0
- 		
- 		#read SAM 
--		print >>sys.stderr, "reading "+ self.fileName + '...',
-+		print("reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -990,10 +990,10 @@ class QCSAM:
- 					ranges[chrom].add_interval( Interval( mid, mid ) )
-     			
- 		self.f.seek(0)
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
- 		#read refbed file
--		print >>sys.stderr, "Assign reads to "+ refbed + '...',
-+		print("Assign reads to "+ refbed + '...', end=' ', file=sys.stderr)
- 		for line in open(refbed,'r'):
- 			try:
- 				if line.startswith('#'):continue
-@@ -1007,14 +1007,14 @@ class QCSAM:
- 				geneName      = fields[3]
- 				strand    = fields[5].replace(" ","_")
- 				
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 				intron_starts = exon_ends[:-1]
- 				intron_ends=exon_starts[1:]
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line,
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, end=' ', file=sys.stderr)
- 				continue
- 
- 				# assign reads to intron				
-@@ -1050,28 +1050,28 @@ class QCSAM:
- 						EXON_OUT.write(chrom + "\t" + str(st) + "\t" + str(end) + "\t" + geneName + "_exon_" + str(exonNum) + "\t" + str(hits) + "\t" + strand + '\n')
- 						exonNum += 1		
- 		intergenicReads=totalReads-exonReads-intronReads-splicedReads		
--		print >>sys.stderr, "Done." + '\n'
--		print >>sys.stderr, "Total reads:\t" + str(totalReads)
--		print >>sys.stderr, "Exonic reads:\t" + str(exonReads) 
--		print >>sys.stderr, "Intronic reads:\t" + str(intronReads) 
--		print >>sys.stderr, "Splicing reads:\t" + str(splicedReads)
--		print >>sys.stderr, "Intergenic reads:\t" + str(intergenicReads)
-+		print("Done." + '\n', file=sys.stderr)
-+		print("Total reads:\t" + str(totalReads), file=sys.stderr)
-+		print("Exonic reads:\t" + str(exonReads), file=sys.stderr) 
-+		print("Intronic reads:\t" + str(intronReads), file=sys.stderr) 
-+		print("Splicing reads:\t" + str(splicedReads), file=sys.stderr)
-+		print("Intergenic reads:\t" + str(intergenicReads), file=sys.stderr)
- 		
--		print >>sys.stderr,"writing R script ...",
-+		print("writing R script ...", end=' ', file=sys.stderr)
- 		totalReads=float(totalReads)
--		print >>R_OUT, "pdf('%s')" % rpdf
--		print >>R_OUT, "dat=c(%d,%d,%d,%d)" % (exonReads,splicedReads,intronReads,intergenicReads)
--		print >>R_OUT, "lb=c('exon(%.2f)','junction(%.2f)','intron(%.2f)','intergenic(%.2f)')" % (exonReads/totalReads,splicedReads/totalReads,intronReads/totalReads,intergenicReads/totalReads)
--		print >>R_OUT, "pie(dat,labels=lb,col=rainbow(4),clockwise=TRUE,main='Total reads = %d')" % int(totalReads)
--		print >>R_OUT, "dev.off()"
--		print >>sys.stderr, "Done."
-+		print("pdf('%s')" % rpdf, file=R_OUT)
-+		print("dat=c(%d,%d,%d,%d)" % (exonReads,splicedReads,intronReads,intergenicReads), file=R_OUT)
-+		print("lb=c('exon(%.2f)','junction(%.2f)','intron(%.2f)','intergenic(%.2f)')" % (exonReads/totalReads,splicedReads/totalReads,intronReads/totalReads,intergenicReads/totalReads), file=R_OUT)
-+		print("pie(dat,labels=lb,col=rainbow(4),clockwise=TRUE,main='Total reads = %d')" % int(totalReads), file=R_OUT)
-+		print("dev.off()", file=R_OUT)
-+		print("Done.", file=sys.stderr)
- 	
- 	
- 	def coverageGeneBody(self,refbed,outfile=None):
- 		'''Calculate reads coverage over gene body, from 5'to 3'. each gene will be equally divied
- 		into 100 regsions'''
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		if outfile is None:
- 			outfile1 = self.fileName + ".geneBodyCoverage_plot.r"
-@@ -1088,7 +1088,7 @@ class QCSAM:
- 		rpkm={}
- 		
- 		#read SAM 
--		print >>sys.stderr, "reading "+ self.fileName + '...',
-+		print("reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -1114,9 +1114,9 @@ class QCSAM:
- 					ranges[chrom] = Intersecter()
- 				else:
- 					ranges[chrom].add_interval( Interval( st, st+size ) )
--		print >>sys.stderr, "Done"   	
-+		print("Done", file=sys.stderr)   	
- 
--		print >>sys.stderr, "calculating coverage over gene body ..."
-+		print("calculating coverage over gene body ...", file=sys.stderr)
- 		coverage=collections.defaultdict(int)
- 		flag=0
- 		for line in open(refbed,'r'):
-@@ -1130,19 +1130,19 @@ class QCSAM:
- 				geneName      = fields[3]
- 				strand    = fields[5]
- 				
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line,
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, end=' ', file=sys.stderr)
- 				continue
- 			gene_all_base=[]
- 			percentile_base=[]
- 			mRNA_len =0
- 			flag=0
- 			for st,end in zip(exon_starts,exon_ends):
--				gene_all_base.extend(range(st+1,end+1))		#0-based coordinates on genome
-+				gene_all_base.extend(list(range(st+1,end+1)))		#0-based coordinates on genome
- 				mRNA_len = len(gene_all_base)
- 				if mRNA_len <100:
- 					flag=1
-@@ -1159,18 +1159,18 @@ class QCSAM:
- 					coverage[i] += len(ranges[chrom].find(percentile_base[i], percentile_base[i]+1))
- 		x_coord=[]
- 		y_coord=[]
--		print >>OUT2, "Total reads: " + str(totalReads)
--		print >>OUT2, "Fragment number: " + str(fragment_num)
--		print >>OUT2, "percentile\tcount"
-+		print("Total reads: " + str(totalReads), file=OUT2)
-+		print("Fragment number: " + str(fragment_num), file=OUT2)
-+		print("percentile\tcount", file=OUT2)
- 		for i in coverage:
- 			x_coord.append(str(i))
- 			y_coord.append(str(coverage[i]))
--			print >>OUT2, str(i) + '\t' + str(coverage[i])
--		print >>OUT1, "pdf('geneBody_coverage.pdf')"
--		print >>OUT1, "x=0:100"
--		print >>OUT1, "y=c(" + ','.join(y_coord) + ')'
--		print >>OUT1, "plot(x,y,xlab=\"percentile of gene body (5'->3')\",ylab='read number',type='s')"
--		print >>OUT1, "dev.off()"
-+			print(str(i) + '\t' + str(coverage[i]), file=OUT2)
-+		print("pdf('geneBody_coverage.pdf')", file=OUT1)
-+		print("x=0:100", file=OUT1)
-+		print("y=c(" + ','.join(y_coord) + ')', file=OUT1)
-+		print("plot(x,y,xlab=\"percentile of gene body (5'->3')\",ylab='read number',type='s')", file=OUT1)
-+		print("dev.off()", file=OUT1)
- 			
- 	def calculateRPKM(self,refbed,outfile=None):
- 		'''calculate RPKM values for each gene in refbed. Only uniquely aligned reads are used. 
-@@ -1178,7 +1178,7 @@ class QCSAM:
- 		exon per Million mapped reads) for each exon, intron and mRNA'''
- 		
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		if outfile is None:
- 			rpkm_file = self.fileName + ".rpkm.xls"
-@@ -1194,7 +1194,7 @@ class QCSAM:
- 		rpkm={}
- 		
- 		#read SAM 
--		print >>sys.stderr, "reading "+ self.fileName + '...',
-+		print("reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -1228,17 +1228,17 @@ class QCSAM:
- 					ranges[chrom].add_interval( Interval( mid, mid ) )
-     			
- 		self.f.seek(0)
--		print >>sys.stderr, "Done"
--		print >>RPKM_OUT, "Total mapped reads (TR): " + str(totalReads) 
--		print >>RPKM_OUT, "Multiple mapped reads (MR): " + str(multiMapReads)
--		print >>RPKM_OUT, "Uniquely mapped reads (UR): " + str(totalReads - multiMapReads)
--		print >>RPKM_OUT, "Spliced  mapped reads (SR): " + str(sR)
--		print >>RPKM_OUT, "Corrected uniquely mapped reads (cUR): " + str(cUR)
-+		print("Done", file=sys.stderr)
-+		print("Total mapped reads (TR): " + str(totalReads), file=RPKM_OUT) 
-+		print("Multiple mapped reads (MR): " + str(multiMapReads), file=RPKM_OUT)
-+		print("Uniquely mapped reads (UR): " + str(totalReads - multiMapReads), file=RPKM_OUT)
-+		print("Spliced  mapped reads (SR): " + str(sR), file=RPKM_OUT)
-+		print("Corrected uniquely mapped reads (cUR): " + str(cUR), file=RPKM_OUT)
- 		if totalReads ==0:
- 			sys.exit(1)
- 		
- 		#read refbed file
--		print >>sys.stderr, "Assign reads to "+ refbed + '...',
-+		print("Assign reads to "+ refbed + '...', end=' ', file=sys.stderr)
- 		for line in open(refbed,'r'):
- 			try:
- 				if line.startswith('#'):continue
-@@ -1252,16 +1252,16 @@ class QCSAM:
- 				geneName      = fields[3]
- 				strand    = fields[5].replace(" ","_")
- 				
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends)
--				exon_sizes = map(int,fields[10].rstrip(',\n').split(','))
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends))
-+				exon_sizes = list(map(int,fields[10].rstrip(',\n').split(',')))
- 				intron_starts = exon_ends[:-1]
- 				intron_ends=exon_starts[1:]
- 				key='\t'.join((chrom.lower(),str(tx_start),str(tx_end),geneName,'0',strand))
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line,
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, end=' ', file=sys.stderr)
- 				continue
- 
- 			# assign reads to intron				
-@@ -1309,7 +1309,7 @@ class QCSAM:
- 				except:
- 					RPKM_OUT.write(chrom.lower() + "\t" + str(tx_start) + "\t" + str(tx_end) + "\t" + geneName + "_mRNA" + "\t" + str(0) + "\t" + strand + '\t' +  str(0) +'\n')
- 					rpkm[key] = 0
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		return rpkm
- 		self.f.seek(0)
- 
-@@ -1320,7 +1320,7 @@ class QCSAM:
- 		NOTE: intronic reads are not counted as part of total reads'''
- 		
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		if outfile is None:
- 			rpkm_file = self.fileName + ".rpkm.xls"
-@@ -1338,7 +1338,7 @@ class QCSAM:
- 		rpkm={}
- 		
- 		#read gene model file, the purpose is to remove intronic reads
--		print >>sys.stderr, "Reading reference gene model "+ refbed + '...'
-+		print("Reading reference gene model "+ refbed + '...', file=sys.stderr)
- 		for line in open(refbed,'r'):
- 			try:
- 				if line.startswith(('#','track','browser')):continue
-@@ -1351,12 +1351,12 @@ class QCSAM:
- 				geneName      = fields[3]
- 				strand    = fields[5].replace(" ","_")
- 				
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line,
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, end=' ', file=sys.stderr)
- 				continue	
- 
- 			for st,end in zip(exon_starts,exon_ends):				
-@@ -1366,7 +1366,7 @@ class QCSAM:
- 					exon_ranges[chrom].add_interval( Interval( st, end ) )		
- 
- 		#read SAM 
--		print >>sys.stderr, "reading "+ self.fileName + '...',
-+		print("reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -1401,22 +1401,22 @@ class QCSAM:
- 						ranges[chrom] = Intersecter()
- 					else:
- 						ranges[chrom].add_interval( Interval( mid, mid ) )
--    			else:																			#if this framgnet is intronic, skip it.
-+			else:																			#if this framgnet is intronic, skip it.
-     				#intronic +=1
--    				continue	
-+ 				continue	
- 		self.f.seek(0)
--		print >>sys.stderr, "Done"
--		print >>RPKM_OUT, "Total mapped reads (TR): " + str(totalReads) 
--		print >>RPKM_OUT, "Multiple mapped reads (MR): " + str(multiMapReads)
--		print >>RPKM_OUT, "Uniquely mapped reads (UR): " + str(totalReads - multiMapReads)
--		print >>RPKM_OUT, "Spliced  mapped reads (SR): " + str(sR)
--		print >>RPKM_OUT, "Corrected uniquely mapped reads (cUR, non-intronic fragments): " + str(cUR)
-+		print("Done", file=sys.stderr)
-+		print("Total mapped reads (TR): " + str(totalReads), file=RPKM_OUT) 
-+		print("Multiple mapped reads (MR): " + str(multiMapReads), file=RPKM_OUT)
-+		print("Uniquely mapped reads (UR): " + str(totalReads - multiMapReads), file=RPKM_OUT)
-+		print("Spliced  mapped reads (SR): " + str(sR), file=RPKM_OUT)
-+		print("Corrected uniquely mapped reads (cUR, non-intronic fragments): " + str(cUR), file=RPKM_OUT)
- 		#print >>RPKM_OUT, "Intronic Fragments (IF): " + str(intronic)
- 		if totalReads ==0:
- 			sys.exit(1)
- 		
- 		#read refbed file
--		print >>sys.stderr, "Assign reads to "+ refbed + '...',
-+		print("Assign reads to "+ refbed + '...', end=' ', file=sys.stderr)
- 		for line in open(refbed,'r'):
- 			try:
- 				if line.startswith('#'):continue
-@@ -1430,16 +1430,16 @@ class QCSAM:
- 				geneName      = fields[3]
- 				strand    = fields[5].replace(" ","_")
- 				
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends)
--				exon_sizes = map(int,fields[10].rstrip(',\n').split(','))
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends))
-+				exon_sizes = list(map(int,fields[10].rstrip(',\n').split(',')))
- 				intron_starts = exon_ends[:-1]
- 				intron_ends=exon_starts[1:]
- 				key='\t'.join((chrom.lower(),str(tx_start),str(tx_end),geneName,'0',strand))
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line,
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, end=' ', file=sys.stderr)
- 				continue
- 
- 			# assign reads to intron				
-@@ -1487,7 +1487,7 @@ class QCSAM:
- 				except:
- 					RPKM_OUT.write(chrom.lower() + "\t" + str(tx_start) + "\t" + str(tx_end) + "\t" + geneName + "_mRNA" + "\t" + str(0) + "\t" + strand + '\t' +  str(0) +'\n')
- 					rpkm[key] = 0
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		return rpkm
- 		self.f.seek(0)
- 
-@@ -1499,7 +1499,7 @@ class QCSAM:
- 		unknownReads=0
- 		ranges={}
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		
- 		if outfile is None:
-@@ -1508,7 +1508,7 @@ class QCSAM:
- 			out_file = outfile + ".unknownReads.SAM"	
- 		OUT=open(out_file,'w')
- 		
--		print >>sys.stderr, "Reading reference gene model "+ refbed + '...'
-+		print("Reading reference gene model "+ refbed + '...', file=sys.stderr)
- 		for line in open(refbed,'r'):
- 			try:
- 				if line.startswith(('#','track','browser')):continue
-@@ -1521,12 +1521,12 @@ class QCSAM:
- 				geneName      = fields[3]
- 				strand    = fields[5].replace(" ","_")
- 				
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line,
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, end=' ', file=sys.stderr)
- 				continue	
- 
- 			for st,end in zip(exon_starts,exon_ends):				
-@@ -1535,7 +1535,7 @@ class QCSAM:
- 				else:
- 					ranges[chrom].add_interval( Interval( st, end ) )		
- 
--		print >>sys.stderr, "Processing SAM file "+ self.fileName + '...'
-+		print("Processing SAM file "+ self.fileName + '...', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -1564,8 +1564,8 @@ class QCSAM:
- 				OUT.write(line)
- 				unknownReads +=1
- 		OUT.close()
--		print >>sys.stderr, "Total reads mapped to genome: " + str(totalReads)
--		print >>sys.stderr, "Total reads not overlapped with any exon: " + str(unknownReads)
-+		print("Total reads mapped to genome: " + str(totalReads), file=sys.stderr)
-+		print("Total reads not overlapped with any exon: " + str(unknownReads), file=sys.stderr)
- 		self.f.seek(0)
- 
- 	def genomicFragSize(self,outfile=None,low_bound=0,up_bound=1000,step=10):
-@@ -1589,16 +1589,16 @@ class QCSAM:
- 		ranges={}
- 		ranges[chrom]=Intersecter()
- 		
--		window_left_bound = range(low_bound,up_bound,step)
-- 		frag_size=0
-+		window_left_bound = list(range(low_bound,up_bound,step))
-+		frag_size=0
- 
-- 		pair_num=0.0
-- 		ultra_low=0.0
-- 		ultra_high=0.0
-- 		size=[]
-- 		counts=[]
-- 		count=0
--		print >>sys.stderr, "Reading SAM file "+ self.fileName + ' ... ',
-+		pair_num=0.0
-+		ultra_low=0.0
-+		ultra_high=0.0
-+		size=[]
-+		counts=[]
-+		count=0
-+		print("Reading SAM file "+ self.fileName + ' ... ', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -1606,7 +1606,7 @@ class QCSAM:
- 			#	continue
- 			flagCode=string.atoi(fields[1])
- 			if (flagCode & 0x0001) ==0:
--				print >>sys.stderr,"NOT pair-end sequencing"
-+				print("NOT pair-end sequencing", file=sys.stderr)
- 				sys.exit(1)
- 			if (flagCode & 0x0004) != 0: continue			#skip unmap reads
- 			if not ParseSAM._uniqueHit_pat.search(line):	#skip multiple mapped reads
-@@ -1632,29 +1632,29 @@ class QCSAM:
- 				ultra_high +=1
- 				continue
- 			ranges[chrom].add_interval( Interval( frag_size-1, frag_size ) )
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
- 		if pair_num==0:
--			print >>sys.stderr, "Cannot find paired reads"
-+			print("Cannot find paired reads", file=sys.stderr)
- 			sys.exit(0)
--		print >>FQ, "Total paired read " + str(pair_num)
--		print >>FQ, "<=" + str(low_bound) + "\t"+ str(ultra_low)
-+		print("Total paired read " + str(pair_num), file=FQ)
-+		print("<=" + str(low_bound) + "\t"+ str(ultra_low), file=FQ)
- 		for st in window_left_bound:
- 			size.append(str(st + step/2))
- 			count = str(len(ranges[chrom].find(st,st + step)))
- 			counts.append(count)
--			print >>FQ, str(st) + '\t' + str(st+step) +'\t' + count		
--		print >>FQ, ">" + str(up_bound) + "\t"+ str(ultra_high)
-+			print(str(st) + '\t' + str(st+step) +'\t' + count, file=FQ)		
-+		print(">" + str(up_bound) + "\t"+ str(ultra_high), file=FQ)
- 		
--		print >>RS, "pdf('gFragSize.pdf')"
--		print >>RS, "par(mfrow=c(2,1),cex.main=0.8,cex.lab=0.8,cex.axis=0.8,mar=c(4,4,4,1))"
--		print >>RS, 'pie(c(%d,%d,%d),col=rainbow(3),cex=0.5,radius=1,main="Total %d fragments",labels=c("fraSize <= %d\\n(%4.2f%%)","fragSize > %d\\n(%4.2f%%)","%d < fragSize <= %d\\n(%4.2f%%)"), density=rep(80,80,80),angle=c(90,140,170))' % (ultra_low, ultra_high, pair_num -ultra_low -ultra_high, pair_num, low_bound, ultra_low*100/pair_num, up_bound, ultra_high*100/pair_num, low_bound, up_bound, 100-ultra_low*100/pair_num - ultra_high*100/pair_num)
--		print >>RS, 'fragsize=rep(c(' + ','.join(size) + '),' + 'times=c(' + ','.join(counts) + '))'
--		print >>RS, 'frag_sd = round(sd(fragsize))'
--		print >>RS, 'frag_mean = round(mean(fragsize))'
--		print >>RS, 'hist(fragsize,probability=T,breaks=%d,xlab="Fragment size (bp)",main=paste(c("Mean=",frag_mean,";","SD=",frag_sd),collapse=""),border="blue")' % len(window_left_bound)
--		print >>RS, "lines(density(fragsize,bw=%d),col='red')" % (2*step)
--		print >>RS ,"dev.off()"
-+		print("pdf('gFragSize.pdf')", file=RS)
-+		print("par(mfrow=c(2,1),cex.main=0.8,cex.lab=0.8,cex.axis=0.8,mar=c(4,4,4,1))", file=RS)
-+		print('pie(c(%d,%d,%d),col=rainbow(3),cex=0.5,radius=1,main="Total %d fragments",labels=c("fraSize <= %d\\n(%4.2f%%)","fragSize > %d\\n(%4.2f%%)","%d < fragSize <= %d\\n(%4.2f%%)"), density=rep(80,80,80),angle=c(90,140,170))' % (ultra_low, ultra_high, pair_num -ultra_low -ultra_high, pair_num, low_bound, ultra_low*100/pair_num, up_bound, ultra_high*100/pair_num, low_bound, up_bound, 100-ultra_low*100/pair_num - ultra_high*100/pair_num), file=RS)
-+		print('fragsize=rep(c(' + ','.join(size) + '),' + 'times=c(' + ','.join(counts) + '))', file=RS)
-+		print('frag_sd = round(sd(fragsize))', file=RS)
-+		print('frag_mean = round(mean(fragsize))', file=RS)
-+		print('hist(fragsize,probability=T,breaks=%d,xlab="Fragment size (bp)",main=paste(c("Mean=",frag_mean,";","SD=",frag_sd),collapse=""),border="blue")' % len(window_left_bound), file=RS)
-+		print("lines(density(fragsize,bw=%d),col='red')" % (2*step), file=RS)
-+		print("dev.off()", file=RS)
- 		FO.close()
- 		FQ.close()
- 		RS.close()
-@@ -1665,7 +1665,7 @@ class QCSAM:
- 		'''for each gene, check if its RPKM (epxresion level) has already been saturated or not'''
- 		
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		if outfile is None:
- 			rpkm_file = self.fileName + ".eRPKM.xls"
-@@ -1685,7 +1685,7 @@ class QCSAM:
- 		#read SAM 
- 		my_pat = re.compile(r'NH:i:(\d+)\b')
- 		NH_tag=0
--		print >>sys.stderr, "Reading "+ self.fileName + '...',
-+		print("Reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -1698,7 +1698,7 @@ class QCSAM:
- 			elif len(hitNum) ==1:
- 				if int(hitNum[0])>1: continue				#skip multiple mapped reads
- 			else:
--				print >>sys.stderr, "More than 1 NH tag found within a single line. Incorrect SAM format!"
-+				print("More than 1 NH tag found within a single line. Incorrect SAM format!", file=sys.stderr)
- 				sys.exit(1)
- 
- 			chrom = fields[2].upper()
-@@ -1719,12 +1719,12 @@ class QCSAM:
- 				block_list.append(chrom + ":" + str(mid))
- 		
- 		if NH_tag==1:
--			print >>sys.stderr, "Warn: NO NH tag found. Cannot determine uniqueness of alignment. All alignments will be used"
--		print >>sys.stderr, "Done"
-+			print("Warn: NO NH tag found. Cannot determine uniqueness of alignment. All alignments will be used", file=sys.stderr)
-+		print("Done", file=sys.stderr)
- 		
--		print >>sys.stderr, "shuffling alignments ...",
-+		print("shuffling alignments ...", end=' ', file=sys.stderr)
- 		random.shuffle(block_list)
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
- 		
- 		ranges={}
-@@ -1734,7 +1734,7 @@ class QCSAM:
- 		rawCount_table=collections.defaultdict(list)
- 		RPKM_head=['chr','start','end','name','score','strand']
- 
--		tmp=range(sample_start,sample_end,sample_step)
-+		tmp=list(range(sample_start,sample_end,sample_step))
- 		tmp.append(100)
- 		#=========================sampling uniquely mapped reads from population
- 		for pertl in tmp:	#[5, 10, 15, 20, 25, 30, 35, 40, 45, 50, 55, 60, 65, 70, 75, 80, 85, 90, 95,100]
-@@ -1744,7 +1744,7 @@ class QCSAM:
- 			sample_size += index_end -index_st
- 			
- 			RPKM_head.append(str(pertl) + '%')
--			print >>sys.stderr, "sampling " + str(pertl) +"% (" + str(sample_size) + ") fragments ...",
-+			print("sampling " + str(pertl) +"% (" + str(sample_size) + ") fragments ...", end=' ', file=sys.stderr)
- 			for i in range(index_st, index_end):
- 				(chr,coord) = block_list[i].split(':')
- 				if chr not in ranges:
-@@ -1763,14 +1763,14 @@ class QCSAM:
- 					tx_end    = int( fields[2] )
- 					geneName      = fields[3]
- 					strand    = fields[5].replace(" ","_")
--					exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--					exon_starts = map((lambda x: x + tx_start ), exon_starts)
--					exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--					exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends)
--					exon_sizes = map(int,fields[10].rstrip(',\n').split(','))
-+					exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+					exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+					exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+					exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends))
-+					exon_sizes = list(map(int,fields[10].rstrip(',\n').split(',')))
- 					key='\t'.join((chrom.lower(),str(tx_start),str(tx_end),geneName,'0',strand))
- 				except:
--					print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line
-+					print("[NOTE:input bed must be 12-column] skipped this line: " + line, file=sys.stderr)
- 					continue
- 				mRNA_count=0	#we need to initializ it to 0 for each gene
- 				mRNA_len=sum(exon_sizes)
-@@ -1778,24 +1778,24 @@ class QCSAM:
- 					if chrom in ranges:
- 						mRNA_count += len(ranges[chrom].find(st,end))		
- 				if mRNA_len ==0:
--					print >>sys.stderr, geneName + " has 0 nucleotides. Exit!"
-+					print(geneName + " has 0 nucleotides. Exit!", file=sys.stderr)
- 					sys.exit(1)
- 				if sample_size == 0:
--					print >>sys.stderr, "Too few reads to sample. Exit!"
-+					print("Too few reads to sample. Exit!", file=sys.stderr)
- 					sys.exit(1)
- 				mRNA_RPKM = (mRNA_count * 1000000000.0)/(mRNA_len * sample_size)
- 				RPKM_table[key].append(str(mRNA_RPKM))
- 				rawCount_table[key].append(str(mRNA_count))
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 
- 		#self.f.seek(0)
--		print >>RPKM_OUT, '\t'.join(RPKM_head)
--		print >>RAW_OUT, '\t'.join(RPKM_head)
-+		print('\t'.join(RPKM_head), file=RPKM_OUT)
-+		print('\t'.join(RPKM_head), file=RAW_OUT)
- 		for key in RPKM_table:
--			print >>RPKM_OUT, key + '\t',
--			print >>RPKM_OUT, '\t'.join(RPKM_table[key])
--			print >>RAW_OUT, key + '\t',
--			print >>RAW_OUT, '\t'.join(rawCount_table[key])			
-+			print(key + '\t', end=' ', file=RPKM_OUT)
-+			print('\t'.join(RPKM_table[key]), file=RPKM_OUT)
-+			print(key + '\t', end=' ', file=RAW_OUT)
-+			print('\t'.join(rawCount_table[key]), file=RAW_OUT)			
- 
- 	def saturation_junction(self,refgene,outfile=None,sample_start=5,sample_step=5,sample_end=100,min_intron=50,recur=1):
- 		'''check if an RNA-seq experiment is saturated in terms of detecting known splicing junction'''
-@@ -1805,7 +1805,7 @@ class QCSAM:
- 		else:
- 			out_file = outfile + ".junctionSaturation_plot.r"
- 		if refgene is None:
--			print >>sys.stderr, "You must provide reference gene model in bed format."
-+			print("You must provide reference gene model in bed format.", file=sys.stderr)
- 			sys.exit(1)
- 		
- 		OUT = open(out_file,'w')
-@@ -1813,12 +1813,12 @@ class QCSAM:
- 
- 		#reading reference gene 
- 		knownSpliceSites= set()
--		print >>sys.stderr, "reading reference bed file: ",refgene, " ... ",
-+		print("reading reference bed file: ",refgene, " ... ", end=' ', file=sys.stderr)
- 		for line in open(refgene,'r'):
- 			if line.startswith(('#','track','browser')):continue  
- 			fields = line.split()
- 			if(len(fields)<12):
--				print >>sys.stderr, "Invalid bed line (skipped):",line,
-+				print("Invalid bed line (skipped):",line, end=' ', file=sys.stderr)
- 				continue
- 			chrom     = fields[0].upper()
- 			tx_start = int( fields[1] )
-@@ -1826,15 +1826,15 @@ class QCSAM:
- 			if int(fields[9] ==1):
- 				continue    	
- 			
--			exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--			exon_starts = map((lambda x: x + tx_start ), exon_starts)
--			exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--			exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+			exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+			exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+			exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+			exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 			intron_start = exon_ends[:-1]
- 			intron_end=exon_starts[1:]
- 			for st,end in zip (intron_start, intron_end):
- 				knownSpliceSites.add(chrom + ":" + str(st) + "-" + str(end))
--		print >>sys.stderr,"Done! Total "+str(len(knownSpliceSites)) + " known splicing sites"
-+		print("Done! Total "+str(len(knownSpliceSites)) + " known splicing sites", file=sys.stderr)
- 
- 
- 		#read SAM file
-@@ -1842,7 +1842,7 @@ class QCSAM:
- 		intron_start=[]
- 		intron_end=[]
- 		uniqSpliceSites=collections.defaultdict(int)
--		print >>sys.stderr, "Reading "+ self.fileName + '...',
-+		print("Reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -1883,13 +1883,13 @@ class QCSAM:
- 			for st,end in zip(intron_st, intron_end):
- 				samSpliceSites.append(chrom + ":" + str(st) + "-" + str(end))			
- 		#self.f.seek(0)
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
- 
- 
--		print >>sys.stderr, "shuffling alignments ...",
-+		print("shuffling alignments ...", end=' ', file=sys.stderr)
- 		random.shuffle(samSpliceSites)
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 				
- 		#resampling
- 		SR_num = len(samSpliceSites)
-@@ -1898,7 +1898,7 @@ class QCSAM:
- 		known_junc=[]
- 		all_junc=[]
- 		#=========================sampling uniquely mapped reads from population
--		tmp=range(sample_start,sample_end,sample_step)
-+		tmp=list(range(sample_start,sample_end,sample_step))
- 		tmp.append(100)
- 		for pertl in tmp:	#[5, 10, 15, 20, 25, 30, 35, 40, 45, 50, 55, 60, 65, 70, 75, 80, 85, 90, 95,100]
- 			knownSpliceSites_num = 0
-@@ -1907,26 +1907,26 @@ class QCSAM:
- 			if index_st < 0: index_st = 0
- 			sample_size += index_end -index_st
- 			
--			print >>sys.stderr, "sampling " + str(pertl) +"% (" + str(sample_size) + ") unique splicing alignments ...",
-+			print("sampling " + str(pertl) +"% (" + str(sample_size) + ") unique splicing alignments ...", end=' ', file=sys.stderr)
- 			for i in range(index_st, index_end):
- 				uniqSpliceSites[samSpliceSites[i]] +=1	
--			all_junc.append(str(len(uniqSpliceSites.keys())))
-+			all_junc.append(str(len(list(uniqSpliceSites.keys()))))
- 			for sj in uniqSpliceSites:
- 				if sj in knownSpliceSites and uniqSpliceSites[sj] >= recur:
- 					knownSpliceSites_num +=1
--			print >>sys.stderr, str(knownSpliceSites_num) + " known splicing junctions"
-+			print(str(knownSpliceSites_num) + " known splicing junctions", file=sys.stderr)
- 			known_junc.append(str(knownSpliceSites_num))
- 			
- 		#for j in uniq_SJ:
- 			#print >>OUT, j + "\t" + str(uniq_SJ[j])
--		print >>OUT, "pdf('junction_saturation.pdf')"
--		print >>OUT, "x=c(" + ','.join([str(i) for i in tmp]) + ')'
--		print >>OUT, "y=c(" + ','.join(known_junc) + ')'
--		print >>OUT, "z=c(" + ','.join(all_junc) + ')'
--		print >>OUT, "plot(x,z/1000,xlab='percent of total reads',ylab='Number of splicing junctions (x1000)',type='o',col='blue',ylim=c(%d,%d))" % (int(int(known_junc[0])/1000), int(int(all_junc[-1])/1000))
--		print >>OUT, "points(x,y/1000,type='o',col='red')"
--		print >>OUT, 'legend(5,%d, legend=c("All detected junction","Annotated junction"),col=c("blue","red"),lwd=1,pch=1)' % int(int(all_junc[-1])/1000)
--		print >>OUT, "dev.off()"
-+		print("pdf('junction_saturation.pdf')", file=OUT)
-+		print("x=c(" + ','.join([str(i) for i in tmp]) + ')', file=OUT)
-+		print("y=c(" + ','.join(known_junc) + ')', file=OUT)
-+		print("z=c(" + ','.join(all_junc) + ')', file=OUT)
-+		print("plot(x,z/1000,xlab='percent of total reads',ylab='Number of splicing junctions (x1000)',type='o',col='blue',ylim=c(%d,%d))" % (int(int(known_junc[0])/1000), int(int(all_junc[-1])/1000)), file=OUT)
-+		print("points(x,y/1000,type='o',col='red')", file=OUT)
-+		print('legend(5,%d, legend=c("All detected junction","Annotated junction"),col=c("blue","red"),lwd=1,pch=1)' % int(int(all_junc[-1])/1000), file=OUT)
-+		print("dev.off()", file=OUT)
- 
- 	
- 	def annotate_junction(self,refgene,outfile=None,min_intron=50):
-@@ -1941,7 +1941,7 @@ class QCSAM:
- 			out_file = outfile + ".junction.xls"
- 			out_file2 = outfile + ".junction_plot.r"
- 		if refgene is None:
--			print >>sys.stderr, "You must provide reference gene model in bed format."
-+			print("You must provide reference gene model in bed format.", file=sys.stderr)
- 			sys.exit(1)
- 		OUT = open(out_file,'w')
- 		ROUT = open(out_file2,'w')
-@@ -1955,13 +1955,13 @@ class QCSAM:
- 		known_junc =0
- 		splicing_events=collections.defaultdict(int)	
- 		
--		print >>sys.stderr, "\treading reference bed file: ",refgene, " ... ",
-+		print("\treading reference bed file: ",refgene, " ... ", end=' ', file=sys.stderr)
- 		for line in open(refgene,'r'):
- 			if line.startswith(('#','track','browser')):continue  
-            	# Parse fields from gene tabls
- 			fields = line.split()
- 			if(len(fields)<12):
--				print >>sys.stderr, "Invalid bed line (skipped):",line,
-+				print("Invalid bed line (skipped):",line, end=' ', file=sys.stderr)
- 				continue
- 			chrom     = fields[0].upper()
- 			tx_start = int( fields[1] )
-@@ -1969,19 +1969,19 @@ class QCSAM:
- 			if int(fields[9] ==1):
- 				continue    	
- 			
--			exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--			exon_starts = map((lambda x: x + tx_start ), exon_starts)
--			exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--			exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+			exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+			exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+			exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+			exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 			intron_start = exon_ends[:-1]
- 			intron_end=exon_starts[1:]
- 			for i_st,i_end in zip (intron_start, intron_end):
- 				refIntronStarts[chrom][i_st] =i_st
- 				refIntronEnds[chrom][i_end] =i_end			
--		print >>sys.stderr,"Done"
-+		print("Done", file=sys.stderr)
- 		
- 		#reading input SAM file
--		print >>sys.stderr, "\tProcessing "+ self.fileName + '...',
-+		print("\tProcessing "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -2022,25 +2022,25 @@ class QCSAM:
- 			intron_end = blockStart[1:]
- 			for i_st,i_end in zip(intron_st, intron_end):
- 				splicing_events[chrom + ":" + str(i_st) + ":" + str(i_end)] += 1
--				if (refIntronStarts[chrom].has_key(i_st) and refIntronEnds[chrom].has_key(i_end)):
-+				if (i_st in refIntronStarts[chrom] and i_end in refIntronEnds[chrom]):
- 					known_junc +=1																		#known both
--				elif (not refIntronStarts[chrom].has_key(i_st) and not refIntronEnds[chrom].has_key(i_end)):
-+				elif (i_st not in refIntronStarts[chrom] and i_end not in refIntronEnds[chrom]):
- 					novel35_junc +=1																
- 				else:
- 					novel3or5_junc +=1
- 		#self.f.seek(0)
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
--		print >>ROUT, 'pdf("splicing_events_pie.pdf")'
--		print >>ROUT, "events=c(" + ','.join([str(i*100.0/total_junc) for i in (novel3or5_junc,novel35_junc,known_junc)])+ ')'
--		print >>ROUT, 'pie(events,col=c(2,3,4),init.angle=30,angle=c(60,120,150),density=c(70,70,70),main="splicing events",labels=c("partial_novel %d%%","complete_novel %d%%","known %d%%"))' % (round(novel3or5_junc*100.0/total_junc),round(novel35_junc*100.0/total_junc),round(known_junc*100.0/total_junc))
--		print >>ROUT, "dev.off()"
-+		print('pdf("splicing_events_pie.pdf")', file=ROUT)
-+		print("events=c(" + ','.join([str(i*100.0/total_junc) for i in (novel3or5_junc,novel35_junc,known_junc)])+ ')', file=ROUT)
-+		print('pie(events,col=c(2,3,4),init.angle=30,angle=c(60,120,150),density=c(70,70,70),main="splicing events",labels=c("partial_novel %d%%","complete_novel %d%%","known %d%%"))' % (round(novel3or5_junc*100.0/total_junc),round(novel35_junc*100.0/total_junc),round(known_junc*100.0/total_junc)), file=ROUT)
-+		print("dev.off()", file=ROUT)
- 		
--		print >>sys.stderr, "\n==================================================================="
--		print >>sys.stderr, "Total splicing  Events:\t" + str(total_junc)
--		print >>sys.stderr, "Known Splicing Events:\t" + str(known_junc)
--		print >>sys.stderr, "Partial Novel Splicing Events:\t" + str(novel3or5_junc)
--		print >>sys.stderr, "Novel Splicing Events:\t" + str(novel35_junc)
-+		print("\n===================================================================", file=sys.stderr)
-+		print("Total splicing  Events:\t" + str(total_junc), file=sys.stderr)
-+		print("Known Splicing Events:\t" + str(known_junc), file=sys.stderr)
-+		print("Partial Novel Splicing Events:\t" + str(novel3or5_junc), file=sys.stderr)
-+		print("Novel Splicing Events:\t" + str(novel35_junc), file=sys.stderr)
- 		
- 		#reset variables
- 		total_junc =0
-@@ -2048,34 +2048,34 @@ class QCSAM:
- 		novel3or5_junc =0
- 		known_junc =0
- 		
--		print >>OUT, "chrom\tintron_st(0-based)\tintron_end(1-based)\tread_count\tannotation"
-+		print("chrom\tintron_st(0-based)\tintron_end(1-based)\tread_count\tannotation", file=OUT)
- 		for i in splicing_events:
- 			total_junc += 1
- 			(chrom, i_st, i_end) = i.split(":")
--			print >>OUT, '\t'.join([chrom.replace("CHR","chr"),i_st,i_end]) + '\t' + str(splicing_events[i]) + '\t',
-+			print('\t'.join([chrom.replace("CHR","chr"),i_st,i_end]) + '\t' + str(splicing_events[i]) + '\t', end=' ', file=OUT)
- 			i_st = int(i_st)
- 			i_end = int(i_end)
--			if (refIntronStarts[chrom].has_key(i_st) and refIntronEnds[chrom].has_key(i_end)):
--				print >>OUT, "annotated"
-+			if (i_st in refIntronStarts[chrom] and i_end in refIntronEnds[chrom]):
-+				print("annotated", file=OUT)
- 				known_junc +=1
--			elif (not refIntronStarts[chrom].has_key(i_st) and not refIntronEnds[chrom].has_key(i_end)):
--				print >>OUT, 'complete_novel'
-+			elif (i_st not in refIntronStarts[chrom] and i_end not in refIntronEnds[chrom]):
-+				print('complete_novel', file=OUT)
- 				novel35_junc +=1
- 			else:
--				print >>OUT, 'partial_novel'
-+				print('partial_novel', file=OUT)
- 				novel3or5_junc +=1
- 		
- 		
--		print >>sys.stderr, "\nTotal splicing  Junctions:\t" + str(total_junc)
--		print >>sys.stderr, "Known Splicing Junctions:\t" + str(known_junc)
--		print >>sys.stderr, "Partial Novel Splicing Junctions:\t" + str(novel3or5_junc)
--		print >>sys.stderr, "Novel Splicing Junctions:\t" + str(novel35_junc)
--		print >>sys.stderr, "\n==================================================================="
-+		print("\nTotal splicing  Junctions:\t" + str(total_junc), file=sys.stderr)
-+		print("Known Splicing Junctions:\t" + str(known_junc), file=sys.stderr)
-+		print("Partial Novel Splicing Junctions:\t" + str(novel3or5_junc), file=sys.stderr)
-+		print("Novel Splicing Junctions:\t" + str(novel35_junc), file=sys.stderr)
-+		print("\n===================================================================", file=sys.stderr)
- 		
--		print >>ROUT, 'pdf("splicing_junction_pie.pdf")'
--		print >>ROUT, "junction=c(" + ','.join([str(i*100.0/total_junc) for i in (novel3or5_junc,novel35_junc,known_junc,)])+ ')'
--		print >>ROUT, 'pie(junction,col=c(2,3,4),init.angle=30,angle=c(60,120,150),density=c(70,70,70),main="splicing junctions",labels=c("partial_novel %d%%","complete_novel %d%%","known %d%%"))' % (round(novel3or5_junc*100.0/total_junc),round(novel35_junc*100.0/total_junc),round(known_junc*100.0/total_junc))
--		print >>ROUT, "dev.off()"
-+		print('pdf("splicing_junction_pie.pdf")', file=ROUT)
-+		print("junction=c(" + ','.join([str(i*100.0/total_junc) for i in (novel3or5_junc,novel35_junc,known_junc,)])+ ')', file=ROUT)
-+		print('pie(junction,col=c(2,3,4),init.angle=30,angle=c(60,120,150),density=c(70,70,70),main="splicing junctions",labels=c("partial_novel %d%%","complete_novel %d%%","known %d%%"))' % (round(novel3or5_junc*100.0/total_junc),round(novel35_junc*100.0/total_junc),round(known_junc*100.0/total_junc)), file=ROUT)
-+		print("dev.off()", file=ROUT)
- 		#print >>ROUT, "mat=matrix(c(events,junction),byrow=T,ncol=3)"
- 		#print >>ROUT, 'barplot(mat,beside=T,ylim=c(0,100),names=c("known","partial\nnovel","complete\nnovel"),legend.text=c("splicing events","splicing junction"),ylab="Percent")'
- 
-@@ -2083,7 +2083,7 @@ class QCSAM:
- 		'''calculate mRNA's RPKM value'''
- 		
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		if outfile is None:
- 			rpkm_file = self.fileName + ".RPKM.xls"
-@@ -2101,7 +2101,7 @@ class QCSAM:
- 		RPKM_head=['chr','start','end','name','score','strand','length','rawCount','RPKM']		
- 	
- 		#read SAM 
--		print >>sys.stderr, "Reading "+ self.fileName + '...',
-+		print("Reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -2131,10 +2131,10 @@ class QCSAM:
- 				else:
- 					ranges[chrom].add_interval( Interval( mid, mid ) )
- 					
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 
- 		
--		print >>sys.stderr, "Calculating RPKM ...",
-+		print("Calculating RPKM ...", end=' ', file=sys.stderr)
- 		for line in open(refbed,'r'):
- 			try:
- 				if line.startswith(('#','track','browser')):continue  
-@@ -2145,14 +2145,14 @@ class QCSAM:
- 				tx_end    = int( fields[2] )
- 				geneName      = fields[3]
- 				strand    = fields[5].replace(" ","_")
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends)
--				exon_sizes = map(int,fields[10].rstrip(',\n').split(','))
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends))
-+				exon_sizes = list(map(int,fields[10].rstrip(',\n').split(',')))
- 				key='\t'.join((chrom.lower(),str(tx_start),str(tx_end),geneName,'0',strand))
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, file=sys.stderr)
- 				continue
- 			mRNA_count=0	#we need to initializ it to 0 for each gene
- 			mRNA_len=sum(exon_sizes)
-@@ -2164,14 +2164,14 @@ class QCSAM:
- 			mRNAlen_table[key] = mRNA_len
- 			RPKM_table[key] = str(mRNA_RPKM)
- 			rawCount_table[key] = str(mRNA_count)
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
--		print >>RPKM_OUT, '\t'.join(RPKM_head)
-+		print('\t'.join(RPKM_head), file=RPKM_OUT)
- 		for k in RPKM_table:
--			print >>RPKM_OUT, k + '\t',
--			print >>RPKM_OUT, str(mRNAlen_table[k]) + '\t',
--			print >>RPKM_OUT, str(rawCount_table[k]) + '\t',
--			print >>RPKM_OUT, str(RPKM_table[k]) + '\t'
-+			print(k + '\t', end=' ', file=RPKM_OUT)
-+			print(str(mRNAlen_table[k]) + '\t', end=' ', file=RPKM_OUT)
-+			print(str(rawCount_table[k]) + '\t', end=' ', file=RPKM_OUT)
-+			print(str(RPKM_table[k]) + '\t', file=RPKM_OUT)
- 		return RPKM_table
- 		self.f.seek(0)	
- 
-@@ -2180,10 +2180,10 @@ class QCSAM:
- 		use the parental gene as standard, for spliced read, use the splicing motif as strandard'''
- 		
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		if genome is None:
--			print >>sys.stderr,"You must specify genome sequence in fasta format\n"
-+			print("You must specify genome sequence in fasta format\n", file=sys.stderr)
- 			exit(0)
- 		
- 		if outfile is None:
-@@ -2191,19 +2191,19 @@ class QCSAM:
- 		else:
- 			strand_file = outfile + ".strand.infor"		
- 		OUT = open(strand_file,'w')
--		print >>OUT,"read_type\tread_id\tread_seq\tchr\tStart\tCigar\tprotocol_strand\tgene_strand"	
-+		print("read_type\tread_id\tread_seq\tchr\tStart\tCigar\tprotocol_strand\tgene_strand", file=OUT)	
- 		
- 		transtab = string.maketrans("ACGTNX","TGCANX")
- 		motif=sp.upper().split(',')
- 		motif_rev = [m.translate(transtab)[::-1] for m in motif]
- 		
- 		#load genome
--		print >>sys.stderr, "\tloading "+genome+'...'
-+		print("\tloading "+genome+'...', file=sys.stderr)
- 		tmp=fasta.Fasta(genome)
- 		
- 		#load reference gene model
- 		gene_ranges={}
--		print >>sys.stderr, "reading reference gene model ...",
-+		print("reading reference gene model ...", end=' ', file=sys.stderr)
- 		for line in open(refbed,'r'):
- 			try:
- 				if line.startswith(('#','track','browser')):continue  
-@@ -2215,12 +2215,12 @@ class QCSAM:
- 				geneName      = fields[3]
- 				strand    = fields[5]
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, file=sys.stderr)
- 				continue
- 			if chrom not in gene_ranges:
- 				gene_ranges[chrom]=Intersecter()
- 			gene_ranges[chrom].insert(tx_start,tx_end,strand)							
--		print >>sys.stderr, "Done"		
-+		print("Done", file=sys.stderr)		
- 
- 		#read SAM 
- 		
-@@ -2228,7 +2228,7 @@ class QCSAM:
- 		strand_from_protocol = 'unknown'
- 		strand_from_gene='unknown'
- 		strand_stat=collections.defaultdict(int)
--		print >>sys.stderr, "Reading "+ self.fileName + '...',
-+		print("Reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -2258,9 +2258,9 @@ class QCSAM:
- 					else:
- 						strand_from_gene="intergenic"
- 				
--				print >>OUT,read_type + '\t' + fields[0] + '\t' + fields[9] + '\t' + fields[2] + '\t' + fields[3] + '\t' + fields[5] +'\t',
--				print >>OUT,strand_from_protocol + '\t' + strand_from_gene		  
--		 		strand_stat[read_type + '\t' + strand_from_protocol +'\t' + strand_from_gene] +=1  
-+				print(read_type + '\t' + fields[0] + '\t' + fields[9] + '\t' + fields[2] + '\t' + fields[3] + '\t' + fields[5] +'\t', end=' ', file=OUT)
-+				print(strand_from_protocol + '\t' + strand_from_gene, file=OUT)		  
-+				strand_stat[read_type + '\t' + strand_from_protocol +'\t' + strand_from_gene] +=1  
- 
- 
- 			#for spliced read
-@@ -2273,14 +2273,14 @@ class QCSAM:
- 					blockStart.append(readStart + sum(comb[:i]) )
- 				for i in range(0,len(comb),2):
- 					blockSize.append(comb[i])
--				blockEnd=map((lambda x,y:x+y),blockStart,blockSize)
-+				blockEnd=list(map((lambda x,y:x+y),blockStart,blockSize))
- 				intron_start=blockEnd[:-1]
- 				intron_end=blockStart[1:]
- 				for st,end in zip(intron_start,intron_end):
- 					try:
- 						splice_motif = str(tmp.fetchSeq(chrom, st, st+2)) + str(tmp.fetchSeq(chrom, end-2,end))
- 					except:
--							print line
-+							print(line)
- 					if splice_motif in motif:
- 						splice_strand.append('+')
- 					elif splice_motif in motif_rev:
-@@ -2293,16 +2293,16 @@ class QCSAM:
- 						strand_from_splice = 'unknown motif'
- 				else:
- 						strand_from_splice = set(splice_strand).pop()
--				print >>OUT,read_type + '\t' + fields[0] + '\t' + fields[9] + '\t' + fields[2] + '\t' + fields[3] + '\t' + fields[5] +'\t',
--				print >>OUT,strand_from_protocol + '\t' + strand_from_splice
-+				print(read_type + '\t' + fields[0] + '\t' + fields[9] + '\t' + fields[2] + '\t' + fields[3] + '\t' + fields[5] +'\t', end=' ', file=OUT)
-+				print(strand_from_protocol + '\t' + strand_from_splice, file=OUT)
- 				
- 				strand_stat[read_type + '\t' + strand_from_protocol +'\t' + strand_from_splice] +=1
- 							
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
--		print "read_type\tstrand_expected\tstrand_observed\tcount"
-+		print("read_type\tstrand_expected\tstrand_observed\tcount")
- 		for i in sorted(strand_stat):
--				print str(i) +'\t' + str(strand_stat[i])
-+				print(str(i) +'\t' + str(strand_stat[i]))
- 		
- 	def clipping_profile(self,outfile=None):
- 		'''calculate profile of soft clipping'''
-@@ -2315,7 +2315,7 @@ class QCSAM:
- 		
- 		OUT=open(out_file1,'w')
- 		ROUT=open(out_file2,'w')
--		print >>OUT, "Position\tRead_Total\tRead_clipped"
-+		print("Position\tRead_Total\tRead_clipped", file=OUT)
- 		soft_p = re.compile(r'(.*?)(\d+)S')
- 		read_part = re.compile(r'(\d+)[MIS=X]')
- 		total_read =0
-@@ -2324,7 +2324,7 @@ class QCSAM:
- 		
- 		read_pos=[]
- 		clip_count=[]
--		print >>sys.stderr, "Reading "+ self.fileName + '...'
-+		print("Reading "+ self.fileName + '...', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -2349,12 +2349,12 @@ class QCSAM:
- 		for i in soft_clip_profile:
- 			read_pos.append(str(i))
- 			clip_count.append(str(soft_clip_profile[i]))
--			print >>OUT, str(i) + '\t' + str(total_read) + '\t' + str(soft_clip_profile[i])
--		print >>ROUT, "pdf('clipping_profile.pdf')"
--		print >>ROUT, "read_pos=c(" + ','.join(read_pos) + ')'
--		print >>ROUT, "count=c(" + ','.join(clip_count) + ')'
--		print >>ROUT, 'plot(read_pos,1-(count/%d),col="blue",main="clipping profile",xlab="Position of reads",ylab="Mappability",type="b")' % total_read
--		print >>ROUT, "dev.off()"
-+			print(str(i) + '\t' + str(total_read) + '\t' + str(soft_clip_profile[i]), file=OUT)
-+		print("pdf('clipping_profile.pdf')", file=ROUT)
-+		print("read_pos=c(" + ','.join(read_pos) + ')', file=ROUT)
-+		print("count=c(" + ','.join(clip_count) + ')', file=ROUT)
-+		print('plot(read_pos,1-(count/%d),col="blue",main="clipping profile",xlab="Position of reads",ylab="Mappability",type="b")' % total_read, file=ROUT)
-+		print("dev.off()", file=ROUT)
- 		
- 	def insertion_profile(self,read_len,outfile=None):
- 		'''calculate profile of insertion (insertion means insertion to the reference)'''
-@@ -2367,13 +2367,13 @@ class QCSAM:
- 		
- 		OUT=open(out_file1,'w')
- 		ROUT=open(out_file2,'w')
--		print >>OUT, "Position\tRead_Total\tRead_clipped"
-+		print("Position\tRead_Total\tRead_clipped", file=OUT)
- 		soft_p = re.compile(r'(.*?)(\d+)I')
- 		read_part = re.compile(r'(\d+)[MIS=X]')
- 		total_read =0
- 		skip_part_of_read =0
- 		soft_clip_profile=collections.defaultdict(int)
--		print >>sys.stderr, "Reading "+ self.fileName + '...',
-+		print("Reading "+ self.fileName + '...', end=' ', file=sys.stderr)
- 		for line in self.f:
- 			if line.startswith("@"):continue
- 			fields=line.rstrip('\n ').split()
-@@ -2396,7 +2396,7 @@ class QCSAM:
- 						soft_clip_profile[n]+=1
- 					skip_part_of_read += int(j[1])
- 		for i in range(0,read_len):
--			print >>OUT, str(i) + '\t' + str(total_read) + '\t' + str(soft_clip_profile[i])
-+			print(str(i) + '\t' + str(total_read) + '\t' + str(soft_clip_profile[i]), file=OUT)
- 
- class ParseBAM:
- 	'''This class provides fuctions to parsing/processing/transforming SAM or BAM files. The input
-@@ -2408,13 +2408,13 @@ class ParseBAM:
- 		try:
- 			self.samfile = pysam.Samfile(inputFile,'rb')
- 			if len(self.samfile.header) ==0:
--				print >>sys.stderr, "BAM/SAM file has no header section. Exit!"
-+				print("BAM/SAM file has no header section. Exit!", file=sys.stderr)
- 				sys.exit(1)
- 			self.bam_format = True
- 		except:
- 			self.samfile = pysam.Samfile(inputFile,'r')
- 			if len(self.samfile.header) ==0:
--				print >>sys.stderr, "BAM/SAM file has no header section. Exit!"
-+				print("BAM/SAM file has no header section. Exit!", file=sys.stderr)
- 				sys.exit(1)
- 			self.bam_format = False
- 
-@@ -2437,13 +2437,13 @@ class ParseBAM:
- 		R_splice=0
- 		R_properPair =0 
- 
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		try:
- 			while(1):
- 				flag=0
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				R_total +=1
- 				if aligned_read.is_qcfail:			#skip QC fail read
- 					R_qc_fail +=1
-@@ -2487,26 +2487,26 @@ class ParseBAM:
- 						R_properPair +=1
- 				
- 		except StopIteration:
--			print >>sys.stderr, "Done"		
-+			print("Done", file=sys.stderr)		
- 		#self.samfile.seek(current_pos)
- 				
--		print >>sys.stderr,"\n#=================================================="
--		print >>sys.stderr, "%-30s%d" % ("Total Reads (Records):",R_total)
--		print >>sys.stderr, "\n",
--		print >>sys.stderr, "%-30s%d" % ("QC failed:",R_qc_fail)
--		print >>sys.stderr, "%-30s%d" % ("Optical/PCR duplicate:", R_duplicate)
--		print >>sys.stderr, "%-30s%d" % ("Non Primary Hits", R_nonprimary)
--		print >>sys.stderr, "%-30s%d" % ("Unmapped reads:",R_unmap)
--		print >>sys.stderr, "%-30s%d" % ("Multiple mapped reads:",R_multipleHit)
--		print >>sys.stderr, "\n",
--		print >>sys.stderr, "%-30s%d" % ("Uniquely mapped:",R_uniqHit)
--		print >>sys.stderr, "%-30s%d" % ("Read-1:",R_read1)
--		print >>sys.stderr, "%-30s%d" % ("Read-2:",R_read2)
--		print >>sys.stderr, "%-30s%d" % ("Reads map to '+':",R_forward)
--		print >>sys.stderr, "%-30s%d" % ("Reads map to '-':",R_reverse)
--		print >>sys.stderr, "%-30s%d" % ("Non-splice reads:",R_nonSplice)
--		print >>sys.stderr, "%-30s%d" % ("Splice reads:",R_splice)	
--		print >>sys.stderr, "%-30s%d" % ("Reads mapped in proper pairs:",R_properPair)
-+		print("\n#==================================================", file=sys.stderr)
-+		print("%-30s%d" % ("Total Reads (Records):",R_total), file=sys.stderr)
-+		print("\n", end=' ', file=sys.stderr)
-+		print("%-30s%d" % ("QC failed:",R_qc_fail), file=sys.stderr)
-+		print("%-30s%d" % ("Optical/PCR duplicate:", R_duplicate), file=sys.stderr)
-+		print("%-30s%d" % ("Non Primary Hits", R_nonprimary), file=sys.stderr)
-+		print("%-30s%d" % ("Unmapped reads:",R_unmap), file=sys.stderr)
-+		print("%-30s%d" % ("Multiple mapped reads:",R_multipleHit), file=sys.stderr)
-+		print("\n", end=' ', file=sys.stderr)
-+		print("%-30s%d" % ("Uniquely mapped:",R_uniqHit), file=sys.stderr)
-+		print("%-30s%d" % ("Read-1:",R_read1), file=sys.stderr)
-+		print("%-30s%d" % ("Read-2:",R_read2), file=sys.stderr)
-+		print("%-30s%d" % ("Reads map to '+':",R_forward), file=sys.stderr)
-+		print("%-30s%d" % ("Reads map to '-':",R_reverse), file=sys.stderr)
-+		print("%-30s%d" % ("Non-splice reads:",R_nonSplice), file=sys.stderr)
-+		print("%-30s%d" % ("Splice reads:",R_splice), file=sys.stderr)	
-+		print("%-30s%d" % ("Reads mapped in proper pairs:",R_properPair), file=sys.stderr)
- 	
- 	def configure_experiment(self,refbed,sample_size = 200000):
- 		'''Given a BAM/SAM file, this function will try to guess the RNA-seq experiment:
-@@ -2521,7 +2521,7 @@ class ParseBAM:
- 		s_strandness=collections.defaultdict(int)
- 		#load reference gene model
- 		gene_ranges={}
--		print >>sys.stderr, "Reading reference gene model " + refbed + ' ...',
-+		print("Reading reference gene model " + refbed + ' ...', end=' ', file=sys.stderr)
- 		for line in open(refbed,'r'):
- 			try:
- 				if line.startswith(('#','track','browser')):continue  
-@@ -2533,22 +2533,22 @@ class ParseBAM:
- 				geneName      = fields[3]
- 				strand    = fields[5]
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, file=sys.stderr)
- 				continue
- 			if chrom not in gene_ranges:
- 				gene_ranges[chrom]=Intersecter()
- 			gene_ranges[chrom].insert(tx_start,tx_end,strand)							
--		print >>sys.stderr, "Done"		
-+		print("Done", file=sys.stderr)		
- 		
- 		#read SAM/BAM file
- 		#current_pos = self.samfile.tell()
--		print >>sys.stderr, "Loading SAM/BAM file ... ",
-+		print("Loading SAM/BAM file ... ", end=' ', file=sys.stderr)
- 		try:
- 			while(1):
- 				if count >= sample_size:
- 					break
- 				flag=0
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_qcfail:			#skip low quanlity
- 					continue
- 				if aligned_read.is_duplicate:		#skip duplicate read
-@@ -2596,10 +2596,10 @@ class ParseBAM:
- 							count += 1
- 
- 		except StopIteration:
--			print >>sys.stderr, "Finished"		
-+			print("Finished", file=sys.stderr)		
- 		#self.samfile.seek(current_pos)
- 		
--		print >>sys.stderr, "Total " + str(count) + " usable reads were sampled"
-+		print("Total " + str(count) + " usable reads were sampled", file=sys.stderr)
- 		protocol="unknown"
- 		strandness=None
- 		spec1=0.0
-@@ -2640,7 +2640,7 @@ class ParseBAM:
- 		elif len(strand_rule.split(',')) ==2:									#singeEnd, strand-specific
- 			for i in strand_rule.split(','):strandRule[i[0]]=i[1]
- 		else:
--			print >>sys.stderr, "Unknown value of option :'strand_rule' " + strand_rule
-+			print("Unknown value of option :'strand_rule' " + strand_rule, file=sys.stderr)
- 			sys.exit(1)
- 		if len(strandRule) == 0:
- 			FWO = open(outfile + '.wig','w')
-@@ -2650,13 +2650,13 @@ class ParseBAM:
- 		
- 		
- 		read_id=''
--		for chr_name, chr_size in chrom_sizes.items():		#iterate each chrom
-+		for chr_name, chr_size in list(chrom_sizes.items()):		#iterate each chrom
- 			try:
- 				self.samfile.fetch(chr_name,0,chr_size)
- 			except:
--				print >>sys.stderr, "No alignments for " + chr_name + '. skipped'
-+				print("No alignments for " + chr_name + '. skipped', file=sys.stderr)
- 				continue
--			print >>sys.stderr, "Processing " + chr_name + " ..."
-+			print("Processing " + chr_name + " ...", file=sys.stderr)
- 			if len(strandRule) == 0: FWO.write('variableStep chrom='+chr_name+'\n')
- 			else:
- 				FWO.write('variableStep chrom='+chr_name+'\n')
-@@ -2699,12 +2699,12 @@ class ParseBAM:
- 					
- 			if len(strandRule) == 0:							#this is NOT strand specific.
- 				for pos in sorted (Fwig.keys()):
--					print >>FWO, "%d\t%.2f" % (pos,Fwig[pos])
-+					print("%d\t%.2f" % (pos,Fwig[pos]), file=FWO)
- 			else:
- 				for pos in sorted (Fwig.keys()):
--					print >>FWO, "%d\t%.2f" % (pos,Fwig[pos])
-+					print("%d\t%.2f" % (pos,Fwig[pos]), file=FWO)
- 				for pos in sorted (Rwig.keys()):
--					print >>RVO, "%d\t%.2f" % (pos,Rwig[pos])
-+					print("%d\t%.2f" % (pos,Rwig[pos]), file=RVO)
- 				
- 					
- 	def calculate_rpkm(self,geneFile,outfile,strand_rule=None):
-@@ -2732,7 +2732,7 @@ class ParseBAM:
- 		elif len(strand_rule.split(',')) ==2:									#singeEnd, strand-specific
- 			for i in strand_rule.split(','):strandRule[i[0]]=i[1]
- 		else:
--			print >>sys.stderr, "Unknown value of option :'strand_rule' " + strand_rule
-+			print("Unknown value of option :'strand_rule' " + strand_rule, file=sys.stderr)
- 			sys.exit(1)
- 		
- 		uniq_read=0
-@@ -2744,14 +2744,14 @@ class ParseBAM:
- 		rpkm_value={}
- 		
- 		RPKM_OUT = open(outfile,'w')
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 		
- 		#current_pos = self.samfile.tell()
- 		try:
- 			while(1):
- 				flag=0
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_qcfail:continue			#skip low quanlity					
- 				if aligned_read.is_duplicate:continue		#skip duplicate read
- 				if aligned_read.is_secondary:continue		#skip non primary hit
-@@ -2801,11 +2801,11 @@ class ParseBAM:
- 						else:unstrand_ranges[chrom].add_interval( Interval( mid,mid+1 ) )
- 					
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 		#self.samfile.seek(current_pos)
--		print >>RPKM_OUT, "#Total uniquely mapped reads = " + str(uniq_read)
--		print >>RPKM_OUT, "#Total fragments = " + str(total_tags)
--		print >>sys.stderr, "Assign reads to "+ geneFile + '...',
-+		print("#Total uniquely mapped reads = " + str(uniq_read), file=RPKM_OUT)
-+		print("#Total fragments = " + str(total_tags), file=RPKM_OUT)
-+		print("Assign reads to "+ geneFile + '...', end=' ', file=sys.stderr)
- 		for line in open(geneFile,'r'):
- 			try:
- 				if line.startswith('#'):continue
-@@ -2819,16 +2819,16 @@ class ParseBAM:
- 				geneName      = fields[3]
- 				strand    = fields[5].replace(" ","_")
- 				
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends)
--				exon_sizes = map(int,fields[10].rstrip(',\n').split(','))
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends))
-+				exon_sizes = list(map(int,fields[10].rstrip(',\n').split(',')))
- 				intron_starts = exon_ends[:-1]
- 				intron_ends=exon_starts[1:]
- 				key='\t'.join((chrom.lower(),str(tx_start),str(tx_end),geneName,'0',strand))
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line,
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, end=' ', file=sys.stderr)
- 				continue
- 
- 					
-@@ -2892,7 +2892,7 @@ class ParseBAM:
- 					RPKM_OUT.write(chrom.lower() + "\t" + str(tx_start) + "\t" + str(tx_end) + "\t" + geneName + "_mRNA" + "\t" + str(mRNA_count) + "\t" + strand + '\t' +  str(mRNA_count*1000000000.0/(mRNA_len*total_tags)) +'\n')
- 				except:
- 					RPKM_OUT.write(chrom.lower() + "\t" + str(tx_start) + "\t" + str(tx_end) + "\t" + geneName + "_mRNA" + "\t" + str(0) + "\t" + strand + '\t' +  str(0) +'\n')
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 
- 	def readsNVC(self,outfile=None,nx=True):
- 		'''for each read, calculate nucleotide frequency vs position'''
-@@ -2914,12 +2914,12 @@ class ParseBAM:
- 		t_count=[]
- 		n_count=[]
- 		x_count=[]
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		try:
- 			while(1):
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				#if aligned_read.is_unmapped:continue	#skip unmapped read
- 				#if aligned_read.is_qcfail:continue	#skip low quality
- 				RNA_read = aligned_read.seq.upper()		
-@@ -2929,62 +2929,62 @@ class ParseBAM:
- 					key = str(i) + j
- 					base_freq[key] += 1
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 		
--		print >>sys.stderr, "generating data matrix ..."
--		print >>FO, "Position\tA\tC\tG\tT\tN\tX"
--		for i in xrange(len(RNA_read)):
--			print  >>FO, str(i) + '\t',
--			print  >>FO, str(base_freq[str(i) + "A"]) + '\t',
-+		print("generating data matrix ...", file=sys.stderr)
-+		print("Position\tA\tC\tG\tT\tN\tX", file=FO)
-+		for i in range(len(RNA_read)):
-+			print(str(i) + '\t', end=' ', file=FO)
-+			print(str(base_freq[str(i) + "A"]) + '\t', end=' ', file=FO)
- 			a_count.append(str(base_freq[str(i) + "A"]))
--			print  >>FO, str(base_freq[str(i) + "C"]) + '\t',
-+			print(str(base_freq[str(i) + "C"]) + '\t', end=' ', file=FO)
- 			c_count.append(str(base_freq[str(i) + "C"]))
--			print  >>FO, str(base_freq[str(i) + "G"]) + '\t',
-+			print(str(base_freq[str(i) + "G"]) + '\t', end=' ', file=FO)
- 			g_count.append(str(base_freq[str(i) + "G"]))
--			print  >>FO, str(base_freq[str(i) + "T"]) + '\t',
-+			print(str(base_freq[str(i) + "T"]) + '\t', end=' ', file=FO)
- 			t_count.append(str(base_freq[str(i) + "T"]))
--			print  >>FO, str(base_freq[str(i) + "N"]) + '\t',
-+			print(str(base_freq[str(i) + "N"]) + '\t', end=' ', file=FO)
- 			n_count.append(str(base_freq[str(i) + "N"]))
--			print  >>FO, str(base_freq[str(i) + "X"]) + '\t'
-+			print(str(base_freq[str(i) + "X"]) + '\t', file=FO)
- 			x_count.append(str(base_freq[str(i) + "X"]))
- 		FO.close()
- 		
- 		#generating R scripts
--		print >>sys.stderr, "generating R script  ..."
--		print >>RS, "position=c(" + ','.join([str(i) for i in xrange(len(RNA_read))]) + ')'
--		print >>RS, "A_count=c(" + ','.join(a_count) + ')'
--		print >>RS, "C_count=c(" + ','.join(c_count) + ')'
--		print >>RS, "G_count=c(" + ','.join(g_count) + ')'
--		print >>RS, "T_count=c(" + ','.join(t_count) + ')'
--		print >>RS, "N_count=c(" + ','.join(n_count) + ')'
--		print >>RS, "X_count=c(" + ','.join(x_count) + ')'
-+		print("generating R script  ...", file=sys.stderr)
-+		print("position=c(" + ','.join([str(i) for i in range(len(RNA_read))]) + ')', file=RS)
-+		print("A_count=c(" + ','.join(a_count) + ')', file=RS)
-+		print("C_count=c(" + ','.join(c_count) + ')', file=RS)
-+		print("G_count=c(" + ','.join(g_count) + ')', file=RS)
-+		print("T_count=c(" + ','.join(t_count) + ')', file=RS)
-+		print("N_count=c(" + ','.join(n_count) + ')', file=RS)
-+		print("X_count=c(" + ','.join(x_count) + ')', file=RS)
- 		
- 		if nx:
--			print >>RS, "total= A_count + C_count + G_count + T_count + N_count + X_count"
--			print >>RS, "ym=max(A_count/total,C_count/total,G_count/total,T_count/total,N_count/total,X_count/total) + 0.05"
--			print >>RS, "yn=min(A_count/total,C_count/total,G_count/total,T_count/total,N_count/total,X_count/total)"
-+			print("total= A_count + C_count + G_count + T_count + N_count + X_count", file=RS)
-+			print("ym=max(A_count/total,C_count/total,G_count/total,T_count/total,N_count/total,X_count/total) + 0.05", file=RS)
-+			print("yn=min(A_count/total,C_count/total,G_count/total,T_count/total,N_count/total,X_count/total)", file=RS)
- 			
--			print >>RS, 'pdf(\"%s\")' % (outfile +".NVC_plot.pdf")
--			print >>RS, 'plot(position,A_count/total,type="o",pch=20,ylim=c(yn,ym),col="dark green",xlab="Position of Read",ylab="Nucleotide Frequency")'
--			print >>RS, 'lines(position,T_count/total,type="o",pch=20,col="red")'
--			print >>RS, 'lines(position,G_count/total,type="o",pch=20,col="blue")'
--			print >>RS, 'lines(position,C_count/total,type="o",pch=20,col="cyan")'
--			print >>RS, 'lines(position,N_count/total,type="o",pch=20,col="black")'		
--			print >>RS, 'lines(position,X_count/total,type="o",pch=20,col="grey")'	
--			print >>RS, 'legend('+ str(len(RNA_read)-10) + ',ym,legend=c("A","T","G","C","N","X"),col=c("dark green","red","blue","cyan","black","grey"),lwd=2,pch=20,text.col=c("dark green","red","blue","cyan","black","grey"))'
--			print >>RS, "dev.off()"
-+			print('pdf(\"%s\")' % (outfile +".NVC_plot.pdf"), file=RS)
-+			print('plot(position,A_count/total,type="o",pch=20,ylim=c(yn,ym),col="dark green",xlab="Position of Read",ylab="Nucleotide Frequency")', file=RS)
-+			print('lines(position,T_count/total,type="o",pch=20,col="red")', file=RS)
-+			print('lines(position,G_count/total,type="o",pch=20,col="blue")', file=RS)
-+			print('lines(position,C_count/total,type="o",pch=20,col="cyan")', file=RS)
-+			print('lines(position,N_count/total,type="o",pch=20,col="black")', file=RS)		
-+			print('lines(position,X_count/total,type="o",pch=20,col="grey")', file=RS)	
-+			print('legend('+ str(len(RNA_read)-10) + ',ym,legend=c("A","T","G","C","N","X"),col=c("dark green","red","blue","cyan","black","grey"),lwd=2,pch=20,text.col=c("dark green","red","blue","cyan","black","grey"))', file=RS)
-+			print("dev.off()", file=RS)
- 		else:
--			print >>RS, "total= A_count + C_count + G_count + T_count"
--			print >>RS, "ym=max(A_count/total,C_count/total,G_count/total,T_count/total) + 0.05"
--			print >>RS, "yn=min(A_count/total,C_count/total,G_count/total,T_count/total)"
-+			print("total= A_count + C_count + G_count + T_count", file=RS)
-+			print("ym=max(A_count/total,C_count/total,G_count/total,T_count/total) + 0.05", file=RS)
-+			print("yn=min(A_count/total,C_count/total,G_count/total,T_count/total)", file=RS)
- 		
--			print >>RS, 'pdf(\"%s\")' % (outfile +".NVC_plot.pdf")
--			print >>RS, 'plot(position,A_count/total,type="o",pch=20,ylim=c(yn,ym),col="dark green",xlab="Position of Read",ylab="Nucleotide Frequency")'
--			print >>RS, 'lines(position,T_count/total,type="o",pch=20,col="red")'
--			print >>RS, 'lines(position,G_count/total,type="o",pch=20,col="blue")'
--			print >>RS, 'lines(position,C_count/total,type="o",pch=20,col="cyan")'
--			print >>RS, 'legend('+ str(len(RNA_read)-10) + ',ym,legend=c("A","T","G","C"),col=c("dark green","red","blue","cyan"),lwd=2,pch=20,text.col=c("dark green","red","blue","cyan"))'
--			print >>RS, "dev.off()"
-+			print('pdf(\"%s\")' % (outfile +".NVC_plot.pdf"), file=RS)
-+			print('plot(position,A_count/total,type="o",pch=20,ylim=c(yn,ym),col="dark green",xlab="Position of Read",ylab="Nucleotide Frequency")', file=RS)
-+			print('lines(position,T_count/total,type="o",pch=20,col="red")', file=RS)
-+			print('lines(position,G_count/total,type="o",pch=20,col="blue")', file=RS)
-+			print('lines(position,C_count/total,type="o",pch=20,col="cyan")', file=RS)
-+			print('legend('+ str(len(RNA_read)-10) + ',ym,legend=c("A","T","G","C"),col=c("dark green","red","blue","cyan"),lwd=2,pch=20,text.col=c("dark green","red","blue","cyan"))', file=RS)
-+			print("dev.off()", file=RS)
- 		
- 		RS.close()
- 		#self.f.seek(0)
-@@ -2995,8 +2995,8 @@ class ParseBAM:
- 		output = outfile + ".qual.r"
- 		FO=open(output,'w')
- 
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		quality = collections.defaultdict(dict)	#read_pos=>quality score=>count
- 		q_max = -1
-@@ -3005,7 +3005,7 @@ class ParseBAM:
- 		i_box={}	#key is read postion,value is 
- 		try:
- 			while(1):
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				
- 				#if aligned_read.is_unmapped:continue	#skip unmapped read
- 				#if aligned_read.is_qcfail:continue		#skip low quality
-@@ -3024,14 +3024,14 @@ class ParseBAM:
- 					except:
- 						quality[i][q] = 1
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 		
- 		for p in range(0,read_len):
- 			#print str(p) + ':',
- 			val=[]
- 			occurrence=[]
- 			for q in range(q_min,q_max+1):
--				if quality.has_key(p) and quality[p].has_key(q):
-+				if p in quality and q in quality[p]:
- 					val.append(str(q))				
- 					occurrence.append(str(quality[p][q]))	
- 					q_list.append(str(quality[p][q]))
-@@ -3041,21 +3041,21 @@ class ParseBAM:
- 		
- 		
- 		#generate R script for boxplot
--		print >>FO, "pdf(\'%s\')" % (outfile + ".qual.boxplot.pdf")
-+		print("pdf(\'%s\')" % (outfile + ".qual.boxplot.pdf"), file=FO)
- 		for i in sorted(i_box):
--			print >>FO,'p'+str(i) + '<-' + i_box[i]
--		print >>FO, 'boxplot(' + ','.join(['p'+str(i) for i in i_box]) + ',xlab=\"Position of Read(5\'->3\')\",ylab=\"Phred Quality Score\",outline=F' + ')'
--		print >>FO,"dev.off()"
-+			print('p'+str(i) + '<-' + i_box[i], file=FO)
-+		print('boxplot(' + ','.join(['p'+str(i) for i in i_box]) + ',xlab=\"Position of Read(5\'->3\')\",ylab=\"Phred Quality Score\",outline=F' + ')', file=FO)
-+		print("dev.off()", file=FO)
- 		
- 		
- 		#generate R script for heatmap
--		print >>FO, '\n'
--		print >>FO, "pdf(\'%s\')" % (outfile + ".qual.heatmap.pdf")
--		print >>FO, "qual=c(" + ','.join(q_list)  + ')'
--		print >>FO, "mat=matrix(qual,ncol=%s,byrow=F)" % (read_len)
--		print >>FO, 'Lab.palette <- colorRampPalette(c("blue", "orange", "red3","red2","red1","red"), space = "rgb",interpolate=c(\'spline\'))'
--		print >>FO, "heatmap(mat,Rowv=NA,Colv=NA,xlab=\"Position of Read\",ylab=\"Phred Quality Score\",labRow=seq(from=%s,to=%s),col = Lab.palette(256),scale=\"none\" )" % (q_min,q_max)
--		print >>FO, 'dev.off()'
-+		print('\n', file=FO)
-+		print("pdf(\'%s\')" % (outfile + ".qual.heatmap.pdf"), file=FO)
-+		print("qual=c(" + ','.join(q_list)  + ')', file=FO)
-+		print("mat=matrix(qual,ncol=%s,byrow=F)" % (read_len), file=FO)
-+		print('Lab.palette <- colorRampPalette(c("blue", "orange", "red3","red2","red1","red"), space = "rgb",interpolate=c(\'spline\'))', file=FO)
-+		print("heatmap(mat,Rowv=NA,Colv=NA,xlab=\"Position of Read\",ylab=\"Phred Quality Score\",labRow=seq(from=%s,to=%s),col = Lab.palette(256),scale=\"none\" )" % (q_min,q_max), file=FO)
-+		print('dev.off()', file=FO)
- 		
- 		
- 	def readGC(self,outfile=None):
-@@ -3071,12 +3071,12 @@ class ParseBAM:
- 		
- 		gc_hist=collections.defaultdict(int)	#key is GC percent, value is count of reads
- 
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		try:
- 			while(1):
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_unmapped:continue	#skip unmapped read
- 				if aligned_read.is_qcfail:continue		#skip low quality
- 				RNA_read = aligned_read.seq.upper()		
-@@ -3084,19 +3084,19 @@ class ParseBAM:
- 				#print gc_percent
- 				gc_hist[gc_percent] += 1
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 		
--		print >>sys.stderr, "writing GC content ..."	
--		print >>FO, "GC%\tread_count"
--		for i in gc_hist.keys():
--			print >>FO, i + '\t' + str(gc_hist[i])
-+		print("writing GC content ...", file=sys.stderr)	
-+		print("GC%\tread_count", file=FO)
-+		for i in list(gc_hist.keys()):
-+			print(i + '\t' + str(gc_hist[i]), file=FO)
- 			
--		print >>sys.stderr, "writing R script ..."
--		print >>RS, "pdf(\"%s\")" % (outfile +  ".GC_plot.pdf")
--		print >>RS, 'gc=rep(c(' + ','.join([i for i in gc_hist.keys()]) + '),' + 'times=c(' + ','.join([str(i) for i in gc_hist.values()]) + '))'
--		print >>RS, 'hist(gc,probability=T,breaks=%d,xlab="GC content (%%)",ylab="Density of Reads",border="blue",main="")' % 100
-+		print("writing R script ...", file=sys.stderr)
-+		print("pdf(\"%s\")" % (outfile +  ".GC_plot.pdf"), file=RS)
-+		print('gc=rep(c(' + ','.join([i for i in list(gc_hist.keys())]) + '),' + 'times=c(' + ','.join([str(i) for i in list(gc_hist.values())]) + '))', file=RS)
-+		print('hist(gc,probability=T,breaks=%d,xlab="GC content (%%)",ylab="Density of Reads",border="blue",main="")' % 100, file=RS)
- 		#print >>RS, "lines(density(gc),col='red')"
--		print >>RS ,"dev.off()"		
-+		print("dev.off()", file=RS)		
- 		#self.f.seek(0)
- 
- 
-@@ -3120,13 +3120,13 @@ class ParseBAM:
- 		seqDup_count=collections.defaultdict(int)
- 		posDup_count=collections.defaultdict(int)
- 
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		try:
- 			while(1):
- 				exon_boundary=""
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_unmapped:continue	#skip unmapped read
- 				if aligned_read.is_qcfail:continue		#skip low quality
- 				RNA_read = aligned_read.seq.upper()		
-@@ -3142,40 +3142,40 @@ class ParseBAM:
- 				posDup[key] +=1
- 
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 
--		print >>sys.stderr, "report duplicte rate based on sequence ..."
--		print >>SEQ, "Occurrence\tUniqReadNumber"
--		for i in seqDup.values():			#key is occurence, value is uniq reads number (based on seq)
-+		print("report duplicte rate based on sequence ...", file=sys.stderr)
-+		print("Occurrence\tUniqReadNumber", file=SEQ)
-+		for i in list(seqDup.values()):			#key is occurence, value is uniq reads number (based on seq)
- 			seqDup_count[i] +=1
--		for k in sorted(seqDup_count.iterkeys()):	
--			print >>SEQ, str(k) +'\t'+ str(seqDup_count[k])
-+		for k in sorted(seqDup_count.keys()):	
-+			print(str(k) +'\t'+ str(seqDup_count[k]), file=SEQ)
- 		SEQ.close()
- 		
--		print >>sys.stderr, "report duplicte rate based on mapping  ..."
--		print >>POS, "Occurrence\tUniqReadNumber"
--		for i in posDup.values():			#key is occurence, value is uniq reads number (based on coord)
-+		print("report duplicte rate based on mapping  ...", file=sys.stderr)
-+		print("Occurrence\tUniqReadNumber", file=POS)
-+		for i in list(posDup.values()):			#key is occurence, value is uniq reads number (based on coord)
- 			posDup_count[i] +=1
--		for k in sorted(posDup_count.iterkeys()):	
--			print >>POS, str(k) +'\t'+ str(posDup_count[k])
-+		for k in sorted(posDup_count.keys()):	
-+			print(str(k) +'\t'+ str(posDup_count[k]), file=POS)
- 		POS.close()
- 		
- 		
--		print >>sys.stderr, "generate R script ..."
--		print >>RS, "pdf(\'%s\')" % (outfile +".DupRate_plot.pdf")
--		print >>RS, "par(mar=c(5,4,4,5),las=0)"
--		print >>RS, "seq_occ=c(" + ','.join([str(i) for i in sorted(seqDup_count.iterkeys()) ]) + ')'
--		print >>RS, "seq_uniqRead=c(" + ','.join([str(seqDup_count[i]) for i in sorted(seqDup_count.iterkeys()) ]) + ')'
--		print >>RS, "pos_occ=c(" + ','.join([str(i) for i in sorted(posDup_count.iterkeys()) ]) + ')'
--		print >>RS, "pos_uniqRead=c(" + ','.join([str(posDup_count[i]) for i in sorted(posDup_count.iterkeys()) ]) + ')'
--		print >>RS, "plot(pos_occ,log10(pos_uniqRead),ylab='Number of Reads (log10)',xlab='Frequency',pch=4,cex=0.8,col='blue',xlim=c(1,%d),yaxt='n')" % up_bound
--		print >>RS, "points(seq_occ,log10(seq_uniqRead),pch=20,cex=0.8,col='red')"
--		print >>RS, 'ym=floor(max(log10(pos_uniqRead)))'
--		print >>RS, "legend(%d,ym,legend=c('Sequence-base','Mapping-base'),col=c('red','blue'),pch=c(4,20))" % max(up_bound-200,1)
--		print >>RS, 'axis(side=2,at=0:ym,labels=0:ym)'
--		print >>RS, 'axis(side=4,at=c(log10(pos_uniqRead[1]),log10(pos_uniqRead[2]),log10(pos_uniqRead[3]),log10(pos_uniqRead[4])), labels=c(round(pos_uniqRead[1]*100/sum(pos_uniqRead)),round(pos_uniqRead[2]*100/sum(pos_uniqRead)),round(pos_uniqRead[3]*100/sum(pos_uniqRead)),round(pos_uniqRead[4]*100/sum(pos_uniqRead))))'
--		print >>RS, 'mtext(4, text = "Reads %", line = 2)'
--		print >>RS, 'dev.off()'
-+		print("generate R script ...", file=sys.stderr)
-+		print("pdf(\'%s\')" % (outfile +".DupRate_plot.pdf"), file=RS)
-+		print("par(mar=c(5,4,4,5),las=0)", file=RS)
-+		print("seq_occ=c(" + ','.join([str(i) for i in sorted(seqDup_count.keys()) ]) + ')', file=RS)
-+		print("seq_uniqRead=c(" + ','.join([str(seqDup_count[i]) for i in sorted(seqDup_count.keys()) ]) + ')', file=RS)
-+		print("pos_occ=c(" + ','.join([str(i) for i in sorted(posDup_count.keys()) ]) + ')', file=RS)
-+		print("pos_uniqRead=c(" + ','.join([str(posDup_count[i]) for i in sorted(posDup_count.keys()) ]) + ')', file=RS)
-+		print("plot(pos_occ,log10(pos_uniqRead),ylab='Number of Reads (log10)',xlab='Frequency',pch=4,cex=0.8,col='blue',xlim=c(1,%d),yaxt='n')" % up_bound, file=RS)
-+		print("points(seq_occ,log10(seq_uniqRead),pch=20,cex=0.8,col='red')", file=RS)
-+		print('ym=floor(max(log10(pos_uniqRead)))', file=RS)
-+		print("legend(%d,ym,legend=c('Sequence-base','Mapping-base'),col=c('red','blue'),pch=c(4,20))" % max(up_bound-200,1), file=RS)
-+		print('axis(side=2,at=0:ym,labels=0:ym)', file=RS)
-+		print('axis(side=4,at=c(log10(pos_uniqRead[1]),log10(pos_uniqRead[2]),log10(pos_uniqRead[3]),log10(pos_uniqRead[4])), labels=c(round(pos_uniqRead[1]*100/sum(pos_uniqRead)),round(pos_uniqRead[2]*100/sum(pos_uniqRead)),round(pos_uniqRead[3]*100/sum(pos_uniqRead)),round(pos_uniqRead[4]*100/sum(pos_uniqRead))))', file=RS)
-+		print('mtext(4, text = "Reads %", line = 2)', file=RS)
-+		print('dev.off()', file=RS)
- 		#self.f.seek(0)
- 
- 	def clipping_profile(self,outfile):
-@@ -3185,7 +3185,7 @@ class ParseBAM:
- 		
- 		OUT=open(out_file1,'w')
- 		ROUT=open(out_file2,'w')
--		print >>OUT, "Position\tRead_Total\tRead_clipped"
-+		print("Position\tRead_Total\tRead_clipped", file=OUT)
- 		soft_p = re.compile(r'(.*?)(\d+)S')
- 		read_part = re.compile(r'(\d+)[MIS=X]')
- 		total_read =0
-@@ -3195,13 +3195,13 @@ class ParseBAM:
- 		read_pos=[]
- 		clip_count=[]
- 
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		try:
- 			while(1):
- 				exon_boundary=""
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_unmapped:continue	#skip unmapped read
- 				if aligned_read.is_qcfail:continue		#skip low quality
- 				
-@@ -3217,24 +3217,24 @@ class ParseBAM:
- 							soft_clip_profile[n]+=1
- 						skip_part_of_read += int(j[1])
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 			
- 
- 		for i in soft_clip_profile:
- 			read_pos.append(str(i))
- 			clip_count.append(str(soft_clip_profile[i]))
--			print >>OUT, str(i) + '\t' + str(total_read) + '\t' + str(soft_clip_profile[i])
--		print >>ROUT, "pdf('clipping_profile.pdf')"
--		print >>ROUT, "read_pos=c(" + ','.join(read_pos) + ')'
--		print >>ROUT, "count=c(" + ','.join(clip_count) + ')'
--		print >>ROUT, 'plot(read_pos,1-(count/%d),col="blue",main="clipping profile",xlab="Position of reads",ylab="Mappability",type="b")' % total_read
--		print >>ROUT, "dev.off()"
-+			print(str(i) + '\t' + str(total_read) + '\t' + str(soft_clip_profile[i]), file=OUT)
-+		print("pdf('clipping_profile.pdf')", file=ROUT)
-+		print("read_pos=c(" + ','.join(read_pos) + ')', file=ROUT)
-+		print("count=c(" + ','.join(clip_count) + ')', file=ROUT)
-+		print('plot(read_pos,1-(count/%d),col="blue",main="clipping profile",xlab="Position of reads",ylab="Mappability",type="b")' % total_read, file=ROUT)
-+		print("dev.off()", file=ROUT)
- 
- 	def coverageGeneBody(self,refbed,outfile):
- 		'''Calculate reads coverage over gene body, from 5'to 3'. each gene will be equally divided
- 		into 100 regsions'''
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		OUT1 = open(outfile + ".geneBodyCoverage_plot.r",'w')
- 		OUT2 = open(outfile + ".geneBodyCoverage.txt",'w')
-@@ -3245,12 +3245,12 @@ class ParseBAM:
- 		rpkm={}
- 		
- 		#read SAM 
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		try:
- 			while(1):
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_qcfail:continue			#skip low quanlity					
- 				if aligned_read.is_duplicate:continue		#skip duplicate read
- 				if aligned_read.is_secondary:continue		#skip non primary hit
-@@ -3269,9 +3269,9 @@ class ParseBAM:
- 					else:
- 						ranges[chrom].add_interval( Interval( exon[1], exon[2] ) )
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 
--		print >>sys.stderr, "calculating coverage over gene body ..."
-+		print("calculating coverage over gene body ...", file=sys.stderr)
- 		coverage=collections.defaultdict(int)
- 		flag=0
- 		for line in open(refbed,'r'):
-@@ -3285,19 +3285,19 @@ class ParseBAM:
- 				geneName      = fields[3]
- 				strand    = fields[5]
- 				
--				exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--				exon_starts = map((lambda x: x + tx_start ), exon_starts)
--				exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--				exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+				exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+				exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+				exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+				exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 			except:
--				print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line,
-+				print("[NOTE:input bed must be 12-column] skipped this line: " + line, end=' ', file=sys.stderr)
- 				continue
- 			gene_all_base=[]
- 			percentile_base=[]
- 			mRNA_len =0
- 			flag=0
- 			for st,end in zip(exon_starts,exon_ends):
--				gene_all_base.extend(range(st+1,end+1))		#0-based coordinates on genome
-+				gene_all_base.extend(list(range(st+1,end+1)))		#0-based coordinates on genome
- 				mRNA_len = len(gene_all_base)
- 				if mRNA_len <100:
- 					flag=1
-@@ -3314,18 +3314,18 @@ class ParseBAM:
- 					coverage[i] += len(ranges[chrom].find(percentile_base[i], percentile_base[i]+1))
- 		x_coord=[]
- 		y_coord=[]
--		print >>OUT2, "Total reads: " + str(totalReads)
--		print >>OUT2, "Fragment number: " + str(fragment_num)
--		print >>OUT2, "percentile\tcount"
-+		print("Total reads: " + str(totalReads), file=OUT2)
-+		print("Fragment number: " + str(fragment_num), file=OUT2)
-+		print("percentile\tcount", file=OUT2)
- 		for i in coverage:
- 			x_coord.append(str(i))
- 			y_coord.append(str(coverage[i]))
--			print >>OUT2, str(i) + '\t' + str(coverage[i])
--		print >>OUT1, "pdf(\'%s\')" % (outfile + ".geneBodyCoverage.pdf")
--		print >>OUT1, "x=0:100"
--		print >>OUT1, "y=c(" + ','.join(y_coord) + ')'
--		print >>OUT1, "plot(x,y,xlab=\"percentile of gene body (5'->3')\",ylab='read number',type='s')"
--		print >>OUT1, "dev.off()"
-+			print(str(i) + '\t' + str(coverage[i]), file=OUT2)
-+		print("pdf(\'%s\')" % (outfile + ".geneBodyCoverage.pdf"), file=OUT1)
-+		print("x=0:100", file=OUT1)
-+		print("y=c(" + ','.join(y_coord) + ')', file=OUT1)
-+		print("plot(x,y,xlab=\"percentile of gene body (5'->3')\",ylab='read number',type='s')", file=OUT1)
-+		print("dev.off()", file=OUT1)
- 					
- 	def mRNA_inner_distance(self,outfile,refbed,low_bound=0,up_bound=1000,step=10):
- 		'''estimate the inner distance of mRNA pair end fragment. fragment size = insert_size + 2 x read_length'''
-@@ -3342,33 +3342,33 @@ class ParseBAM:
- 		ranges={}
- 		ranges[fchrom]=Intersecter()
- 		
--		window_left_bound = range(low_bound,up_bound,step)
-- 		frag_size=0
-+		window_left_bound = list(range(low_bound,up_bound,step))
-+		frag_size=0
- 		
- 		inner_distance_bitsets=BinnedBitSet()
- 		tmp = BinnedBitSet()
- 		tmp.set_range(0,0)
-- 		pair_num=0.0
-- 		sizes=[]
-- 		counts=[]
-- 		count=0
-- 		
-- 		print >>sys.stderr, "Get intron regions from " + refbed + " ..."
-- 		bed_obj = BED.ParseBED(refbed)
-- 		ref_exons = []
-- 		
-- 		for exn in bed_obj.getExon():
-- 			ref_exons.append([exn[0].upper(), exn[1], exn[2]])
-+		pair_num=0.0
-+		sizes=[]
-+		counts=[]
-+		count=0
-+		
-+		print("Get intron regions from " + refbed + " ...", file=sys.stderr)
-+		bed_obj = BED.ParseBED(refbed)
-+		ref_exons = []
-+		
-+		for exn in bed_obj.getExon():
-+			ref_exons.append([exn[0].upper(), exn[1], exn[2]])
- 		exon_bitsets = binned_bitsets_from_list(ref_exons)		
- 		
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		try:
- 			while(1):
- 				splice_intron_size=0
- 				flag=0
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_qcfail:continue			#skip low quanlity					
- 				if aligned_read.is_duplicate:continue		#skip duplicate read
- 				if aligned_read.is_secondary:continue		#skip non primary hit
-@@ -3430,28 +3430,28 @@ class ParseBAM:
- 					ranges[fchrom].add_interval( Interval( inner_distance-1, inner_distance ) )
- 					
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 		
- 		
- 		if pair_num==0:
--			print >>sys.stderr, "Cannot find paired reads"
-+			print("Cannot find paired reads", file=sys.stderr)
- 			sys.exit(0)
- 		#print >>FQ, "Total paired read " + str(pair_num)
- 		for st in window_left_bound:
- 			sizes.append(str(st + step/2))
- 			count = str(len(ranges[fchrom].find(st,st + step)))
- 			counts.append(count)
--			print >>FQ, str(st) + '\t' + str(st+step) +'\t' + count		
-+			print(str(st) + '\t' + str(st+step) +'\t' + count, file=FQ)		
- 		
--		print >>RS, "pdf(\'%s\')" % (outfile + ".inner_distance_plot.pdf")
-+		print("pdf(\'%s\')" % (outfile + ".inner_distance_plot.pdf"), file=RS)
- 		#print >>RS, "par(mfrow=c(2,1),cex.main=0.8,cex.lab=0.8,cex.axis=0.8,mar=c(4,4,4,1))"
- 		#print >>RS, 'pie(c(%d,%d,%d),col=rainbow(3),cex=0.5,radius=1,main="Total %d fragments",labels=c("fraSize <= %d\\n(%4.2f%%)","fragSize > %d\\n(%4.2f%%)","%d < fragSize <= %d\\n(%4.2f%%)"), density=rep(80,80,80),angle=c(90,140,170))' % (ultra_low, ultra_high, pair_num -ultra_low -ultra_high, pair_num, low_bound, ultra_low*100/pair_num, up_bound, ultra_high*100/pair_num, low_bound, up_bound, 100-ultra_low*100/pair_num - ultra_high*100/pair_num)
--		print >>RS, 'fragsize=rep(c(' + ','.join(sizes) + '),' + 'times=c(' + ','.join(counts) + '))'
--		print >>RS, 'frag_sd = round(sd(fragsize))'
--		print >>RS, 'frag_mean = round(mean(fragsize))'
--		print >>RS, 'hist(fragsize,probability=T,breaks=%d,xlab="mRNA insert size (bp)",main=paste(c("Mean=",frag_mean,";","SD=",frag_sd),collapse=""),border="blue")' % len(window_left_bound)
--		print >>RS, "lines(density(fragsize,bw=%d),col='red')" % (2*step)
--		print >>RS ,"dev.off()"
-+		print('fragsize=rep(c(' + ','.join(sizes) + '),' + 'times=c(' + ','.join(counts) + '))', file=RS)
-+		print('frag_sd = round(sd(fragsize))', file=RS)
-+		print('frag_mean = round(mean(fragsize))', file=RS)
-+		print('hist(fragsize,probability=T,breaks=%d,xlab="mRNA insert size (bp)",main=paste(c("Mean=",frag_mean,";","SD=",frag_sd),collapse=""),border="blue")' % len(window_left_bound), file=RS)
-+		print("lines(density(fragsize,bw=%d),col='red')" % (2*step), file=RS)
-+		print("dev.off()", file=RS)
- 		FO.close()
- 		FQ.close()
- 		RS.close()
-@@ -3465,7 +3465,7 @@ class ParseBAM:
- 		out_file = outfile + ".junction.xls"
- 		out_file2 = outfile + ".junction_plot.r"
- 		if refgene is None:
--			print >>sys.stderr, "You must provide reference gene model in bed format."
-+			print("You must provide reference gene model in bed format.", file=sys.stderr)
- 			sys.exit(1)
- 		OUT = open(out_file,'w')
- 		ROUT = open(out_file2,'w')
-@@ -3479,13 +3479,13 @@ class ParseBAM:
- 		known_junc =0
- 		splicing_events=collections.defaultdict(int)	
- 		
--		print >>sys.stderr, "Reading reference bed file: ",refgene, " ... ",
-+		print("Reading reference bed file: ",refgene, " ... ", end=' ', file=sys.stderr)
- 		for line in open(refgene,'r'):
- 			if line.startswith(('#','track','browser')):continue  
-            	# Parse fields from gene tabls
- 			fields = line.split()
- 			if(len(fields)<12):
--				print >>sys.stderr, "Invalid bed line (skipped):",line,
-+				print("Invalid bed line (skipped):",line, end=' ', file=sys.stderr)
- 				continue
- 			chrom     = fields[0].upper()
- 			tx_start = int( fields[1] )
-@@ -3493,25 +3493,25 @@ class ParseBAM:
- 			if int(fields[9] ==1):
- 				continue    	
- 			
--			exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--			exon_starts = map((lambda x: x + tx_start ), exon_starts)
--			exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--			exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+			exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+			exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+			exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+			exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 			intron_start = exon_ends[:-1]
- 			intron_end=exon_starts[1:]
- 			for i_st,i_end in zip (intron_start, intron_end):
- 				refIntronStarts[chrom][i_st] =i_st
- 				refIntronEnds[chrom][i_end] =i_end			
--		print >>sys.stderr,"Done"
-+		print("Done", file=sys.stderr)
- 		
- 		#reading input SAM file
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 
- 		try:
- 			while(1):
- 				flag=0
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_qcfail:continue			#skip low quanlity					
- 				if aligned_read.is_duplicate:continue		#skip duplicate read
- 				if aligned_read.is_secondary:continue		#skip non primary hit
-@@ -3534,28 +3534,28 @@ class ParseBAM:
- 					total_junc +=1
- 					if intrn[2] - intrn[1] < min_intron:continue
- 					splicing_events[intrn[0] + ":" + str(intrn[1]) + ":" + str(intrn[2])] += 1
--					if (refIntronStarts[chrom].has_key(intrn[1]) and refIntronEnds[chrom].has_key(intrn[2])):
-+					if (intrn[1] in refIntronStarts[chrom] and intrn[2] in refIntronEnds[chrom]):
- 						known_junc +=1																		#known both
--					elif (not refIntronStarts[chrom].has_key(intrn[1]) and not refIntronEnds[chrom].has_key(intrn[2])):
-+					elif (intrn[1] not in refIntronStarts[chrom] and intrn[2] not in refIntronEnds[chrom]):
- 						novel35_junc +=1																
- 					else:
- 						novel3or5_junc +=1
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 		
--		print "total = " + str(total_junc)
-+		print("total = " + str(total_junc))
- 		#self.f.seek(0)
- 		
--		print >>ROUT, 'pdf(\"%s\")' % (outfile + ".junction_plot.pdf")
--		print >>ROUT, "events=c(" + ','.join([str(i*100.0/total_junc) for i in (novel3or5_junc,novel35_junc,known_junc)])+ ')'
--		print >>ROUT, 'pie(events,col=c(2,3,4),init.angle=30,angle=c(60,120,150),density=c(70,70,70),main="splicing events",labels=c("partial_novel %d%%","complete_novel %d%%","known %d%%"))' % (round(novel3or5_junc*100.0/total_junc),round(novel35_junc*100.0/total_junc),round(known_junc*100.0/total_junc))
--		print >>ROUT, "dev.off()"
-+		print('pdf(\"%s\")' % (outfile + ".junction_plot.pdf"), file=ROUT)
-+		print("events=c(" + ','.join([str(i*100.0/total_junc) for i in (novel3or5_junc,novel35_junc,known_junc)])+ ')', file=ROUT)
-+		print('pie(events,col=c(2,3,4),init.angle=30,angle=c(60,120,150),density=c(70,70,70),main="splicing events",labels=c("partial_novel %d%%","complete_novel %d%%","known %d%%"))' % (round(novel3or5_junc*100.0/total_junc),round(novel35_junc*100.0/total_junc),round(known_junc*100.0/total_junc)), file=ROUT)
-+		print("dev.off()", file=ROUT)
- 		
--		print >>sys.stderr, "\n==================================================================="
--		print >>sys.stderr, "Total splicing  Events:\t" + str(total_junc)
--		print >>sys.stderr, "Known Splicing Events:\t" + str(known_junc)
--		print >>sys.stderr, "Partial Novel Splicing Events:\t" + str(novel3or5_junc)
--		print >>sys.stderr, "Novel Splicing Events:\t" + str(novel35_junc)
-+		print("\n===================================================================", file=sys.stderr)
-+		print("Total splicing  Events:\t" + str(total_junc), file=sys.stderr)
-+		print("Known Splicing Events:\t" + str(known_junc), file=sys.stderr)
-+		print("Partial Novel Splicing Events:\t" + str(novel3or5_junc), file=sys.stderr)
-+		print("Novel Splicing Events:\t" + str(novel35_junc), file=sys.stderr)
- 		
- 		#reset variables
- 		total_junc =0
-@@ -3563,36 +3563,36 @@ class ParseBAM:
- 		novel3or5_junc =0
- 		known_junc =0
- 		
--		print >>OUT, "chrom\tintron_st(0-based)\tintron_end(1-based)\tread_count\tannotation"
-+		print("chrom\tintron_st(0-based)\tintron_end(1-based)\tread_count\tannotation", file=OUT)
- 		for i in splicing_events:
- 			total_junc += 1
- 			(chrom, i_st, i_end) = i.split(":")
--			print >>OUT, '\t'.join([chrom.replace("CHR","chr"),i_st,i_end]) + '\t' + str(splicing_events[i]) + '\t',
-+			print('\t'.join([chrom.replace("CHR","chr"),i_st,i_end]) + '\t' + str(splicing_events[i]) + '\t', end=' ', file=OUT)
- 			i_st = int(i_st)
- 			i_end = int(i_end)
--			if (refIntronStarts[chrom].has_key(i_st) and refIntronEnds[chrom].has_key(i_end)):
--				print >>OUT, "annotated"
-+			if (i_st in refIntronStarts[chrom] and i_end in refIntronEnds[chrom]):
-+				print("annotated", file=OUT)
- 				known_junc +=1
--			elif (not refIntronStarts[chrom].has_key(i_st) and not refIntronEnds[chrom].has_key(i_end)):
--				print >>OUT, 'complete_novel'
-+			elif (i_st not in refIntronStarts[chrom] and i_end not in refIntronEnds[chrom]):
-+				print('complete_novel', file=OUT)
- 				novel35_junc +=1
- 			else:
--				print >>OUT, 'partial_novel'
-+				print('partial_novel', file=OUT)
- 				novel3or5_junc +=1
- 		
- 		if total_junc ==0:
--			print >>sys.stderr, "No splice read found"
-+			print("No splice read found", file=sys.stderr)
- 			sys.exit(1)
--		print >>sys.stderr, "\nTotal splicing  Junctions:\t" + str(total_junc)
--		print >>sys.stderr, "Known Splicing Junctions:\t" + str(known_junc)
--		print >>sys.stderr, "Partial Novel Splicing Junctions:\t" + str(novel3or5_junc)
--		print >>sys.stderr, "Novel Splicing Junctions:\t" + str(novel35_junc)
--		print >>sys.stderr, "\n==================================================================="
-+		print("\nTotal splicing  Junctions:\t" + str(total_junc), file=sys.stderr)
-+		print("Known Splicing Junctions:\t" + str(known_junc), file=sys.stderr)
-+		print("Partial Novel Splicing Junctions:\t" + str(novel3or5_junc), file=sys.stderr)
-+		print("Novel Splicing Junctions:\t" + str(novel35_junc), file=sys.stderr)
-+		print("\n===================================================================", file=sys.stderr)
- 		
--		print >>ROUT, 'pdf("splicing_junction_pie.pdf")'
--		print >>ROUT, "junction=c(" + ','.join([str(i*100.0/total_junc) for i in (novel3or5_junc,novel35_junc,known_junc,)])+ ')'
--		print >>ROUT, 'pie(junction,col=c(2,3,4),init.angle=30,angle=c(60,120,150),density=c(70,70,70),main="splicing junctions",labels=c("partial_novel %d%%","complete_novel %d%%","known %d%%"))' % (round(novel3or5_junc*100.0/total_junc),round(novel35_junc*100.0/total_junc),round(known_junc*100.0/total_junc))
--		print >>ROUT, "dev.off()"
-+		print('pdf("splicing_junction_pie.pdf")', file=ROUT)
-+		print("junction=c(" + ','.join([str(i*100.0/total_junc) for i in (novel3or5_junc,novel35_junc,known_junc,)])+ ')', file=ROUT)
-+		print('pie(junction,col=c(2,3,4),init.angle=30,angle=c(60,120,150),density=c(70,70,70),main="splicing junctions",labels=c("partial_novel %d%%","complete_novel %d%%","known %d%%"))' % (round(novel3or5_junc*100.0/total_junc),round(novel35_junc*100.0/total_junc),round(known_junc*100.0/total_junc)), file=ROUT)
-+		print("dev.off()", file=ROUT)
- 		#print >>ROUT, "mat=matrix(c(events,junction),byrow=T,ncol=3)"
- 		#print >>ROUT, 'barplot(mat,beside=T,ylim=c(0,100),names=c("known","partial\nnovel","complete\nnovel"),legend.text=c("splicing events","splicing junction"),ylab="Percent")'
- 
-@@ -3601,7 +3601,7 @@ class ParseBAM:
- 		
- 		out_file = outfile + ".junctionSaturation_plot.r"
- 		if refgene is None:
--			print >>sys.stderr, "You must provide reference gene model in bed format."
-+			print("You must provide reference gene model in bed format.", file=sys.stderr)
- 			sys.exit(1)
- 		
- 		OUT = open(out_file,'w')
-@@ -3609,12 +3609,12 @@ class ParseBAM:
- 
- 		#reading reference gene 
- 		knownSpliceSites= set()
--		print >>sys.stderr, "reading reference bed file: ",refgene, " ... ",
-+		print("reading reference bed file: ",refgene, " ... ", end=' ', file=sys.stderr)
- 		for line in open(refgene,'r'):
- 			if line.startswith(('#','track','browser')):continue  
- 			fields = line.split()
- 			if(len(fields)<12):
--				print >>sys.stderr, "Invalid bed line (skipped):",line,
-+				print("Invalid bed line (skipped):",line, end=' ', file=sys.stderr)
- 				continue
- 			chrom     = fields[0].upper()
- 			tx_start = int( fields[1] )
-@@ -3622,15 +3622,15 @@ class ParseBAM:
- 			if int(fields[9] ==1):
- 				continue    	
- 			
--			exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--			exon_starts = map((lambda x: x + tx_start ), exon_starts)
--			exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--			exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends);   
-+			exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+			exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+			exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+			exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends));   
- 			intron_start = exon_ends[:-1]
- 			intron_end=exon_starts[1:]
- 			for st,end in zip (intron_start, intron_end):
- 				knownSpliceSites.add(chrom + ":" + str(st) + "-" + str(end))
--		print >>sys.stderr,"Done! Total "+str(len(knownSpliceSites)) + " known splicing junctions."
-+		print("Done! Total "+str(len(knownSpliceSites)) + " known splicing junctions.", file=sys.stderr)
- 
- 
- 		#read SAM file
-@@ -3639,12 +3639,12 @@ class ParseBAM:
- 		intron_end=[]
- 		uniqSpliceSites=collections.defaultdict(int)
- 
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 		try:
- 			while(1):
- 				flag=0
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_qcfail:continue			#skip low quanlity					
- 				if aligned_read.is_duplicate:continue		#skip duplicate read
- 				if aligned_read.is_secondary:continue		#skip non primary hit
-@@ -3667,11 +3667,11 @@ class ParseBAM:
- 					if intrn[2] - intrn[1] < min_intron:continue
- 					samSpliceSites.append(intrn[0] + ":" + str(intrn[1]) + "-" + str(intrn[2]))
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 		
--		print >>sys.stderr, "shuffling alignments ...",
-+		print("shuffling alignments ...", end=' ', file=sys.stderr)
- 		random.shuffle(samSpliceSites)
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 				
- 		#resampling
- 		SR_num = len(samSpliceSites)
-@@ -3681,7 +3681,7 @@ class ParseBAM:
- 		all_junc=[]
- 		unknown_junc=[]
- 		#=========================sampling uniquely mapped reads from population
--		tmp=range(sample_start,sample_end,sample_step)
-+		tmp=list(range(sample_start,sample_end,sample_step))
- 		tmp.append(100)
- 		for pertl in tmp:	#[5, 10, 15, 20, 25, 30, 35, 40, 45, 50, 55, 60, 65, 70, 75, 80, 85, 90, 95,100]
- 			knownSpliceSites_num = 0
-@@ -3690,21 +3690,21 @@ class ParseBAM:
- 			if index_st < 0: index_st = 0
- 			sample_size += index_end -index_st
- 			
--			print >>sys.stderr, "sampling " + str(pertl) +"% (" + str(sample_size) + ") splicing reads.",
-+			print("sampling " + str(pertl) +"% (" + str(sample_size) + ") splicing reads.", end=' ', file=sys.stderr)
- 			
- 			#all splice juntion
- 			for i in range(index_st, index_end):
- 				uniqSpliceSites[samSpliceSites[i]] +=1	
--			all_junctionNum = len(uniqSpliceSites.keys())
-+			all_junctionNum = len(list(uniqSpliceSites.keys()))
- 			all_junc.append(str(all_junctionNum))
--			print >>sys.stderr, str(all_junctionNum) + " splicing junctions.",
-+			print(str(all_junctionNum) + " splicing junctions.", end=' ', file=sys.stderr)
- 			
- 			#known splice junction
- 			known_junctionNum = 0
- 			for sj in uniqSpliceSites:
- 				if sj in knownSpliceSites and uniqSpliceSites[sj] >= recur:
- 					known_junctionNum +=1
--			print >>sys.stderr, str(known_junctionNum) + " known splicing junctions.",
-+			print(str(known_junctionNum) + " known splicing junctions.", end=' ', file=sys.stderr)
- 			known_junc.append(str(known_junctionNum))
- 			
- 			#unknown splice junction
-@@ -3713,28 +3713,28 @@ class ParseBAM:
- 				if sj not in knownSpliceSites:
- 					unknown_junctionNum +=1
- 			unknown_junc.append(str(unknown_junctionNum))
--			print >>sys.stderr, str(unknown_junctionNum) + " novel splicing junctions."
-+			print(str(unknown_junctionNum) + " novel splicing junctions.", file=sys.stderr)
- 			
- 		#for j in uniq_SJ:
- 			#print >>OUT, j + "\t" + str(uniq_SJ[j])
--		print >>OUT, "pdf(\'%s\')" % (outfile + '.junctionSaturation_plot.pdf')
--		print >>OUT, "x=c(" + ','.join([str(i) for i in tmp]) + ')'
--		print >>OUT, "y=c(" + ','.join(known_junc) + ')'
--		print >>OUT, "z=c(" + ','.join(all_junc) + ')'
--		print >>OUT, "w=c(" + ','.join(unknown_junc) + ')'
--		print >>OUT, "m=max(%d,%d,%d)" % (int(int(known_junc[-1])/1000), int(int(all_junc[-1])/1000),int(int(unknown_junc[-1])/1000))
--		print >>OUT, "n=min(%d,%d,%d)" % (int(int(known_junc[0])/1000), int(int(all_junc[0])/1000),int(int(unknown_junc[0])/1000))
--		print >>OUT, "plot(x,z/1000,xlab='percent of total reads',ylab='Number of splicing junctions (x1000)',type='o',col='blue',ylim=c(n,m))"
--		print >>OUT, "points(x,y/1000,type='o',col='red')"
--		print >>OUT, "points(x,w/1000,type='o',col='green')"
--		print >>OUT, 'legend(5,%d, legend=c("All junctions","known junctions", "novel junctions"),col=c("blue","red","green"),lwd=1,pch=1)' % int(int(all_junc[-1])/1000)
--		print >>OUT, "dev.off()"
-+		print("pdf(\'%s\')" % (outfile + '.junctionSaturation_plot.pdf'), file=OUT)
-+		print("x=c(" + ','.join([str(i) for i in tmp]) + ')', file=OUT)
-+		print("y=c(" + ','.join(known_junc) + ')', file=OUT)
-+		print("z=c(" + ','.join(all_junc) + ')', file=OUT)
-+		print("w=c(" + ','.join(unknown_junc) + ')', file=OUT)
-+		print("m=max(%d,%d,%d)" % (int(int(known_junc[-1])/1000), int(int(all_junc[-1])/1000),int(int(unknown_junc[-1])/1000)), file=OUT)
-+		print("n=min(%d,%d,%d)" % (int(int(known_junc[0])/1000), int(int(all_junc[0])/1000),int(int(unknown_junc[0])/1000)), file=OUT)
-+		print("plot(x,z/1000,xlab='percent of total reads',ylab='Number of splicing junctions (x1000)',type='o',col='blue',ylim=c(n,m))", file=OUT)
-+		print("points(x,y/1000,type='o',col='red')", file=OUT)
-+		print("points(x,w/1000,type='o',col='green')", file=OUT)
-+		print('legend(5,%d, legend=c("All junctions","known junctions", "novel junctions"),col=c("blue","red","green"),lwd=1,pch=1)' % int(int(all_junc[-1])/1000), file=OUT)
-+		print("dev.off()", file=OUT)
- 
- 	def saturation_RPKM(self,refbed,outfile,sample_start=5,sample_step=5,sample_end=100,skip_multi=True, strand_rule=None):
- 		'''for each gene, check if its RPKM (epxresion level) has already been saturated or not'''
- 		
- 		if refbed is None:
--			print >>sys.stderr,"You must specify a bed file representing gene model\n"
-+			print("You must specify a bed file representing gene model\n", file=sys.stderr)
- 			exit(0)
- 		rpkm_file = outfile + ".eRPKM.xls"
- 		raw_file = outfile + ".rawCount.xls"
-@@ -3759,17 +3759,17 @@ class ParseBAM:
- 		elif len(strand_rule.split(',')) ==2:									#singeEnd, strand-specific
- 			for i in strand_rule.split(','):strandRule[i[0]]=i[1]
- 		else:
--			print >>sys.stderr, "Unknown value of: 'strand_rule' " +  strand_rule
-+			print("Unknown value of: 'strand_rule' " +  strand_rule, file=sys.stderr)
- 			sys.exit(1)	
- 
- 
- 		#read SAM or BAM
--		if self.bam_format:print >>sys.stderr, "Load BAM file ... ",
--		else:print >>sys.stderr, "Load SAM file ... ",
-+		if self.bam_format:print("Load BAM file ... ", end=' ', file=sys.stderr)
-+		else:print("Load SAM file ... ", end=' ', file=sys.stderr)
- 		try:
- 			while(1):
- 				flag=0
--				aligned_read = self.samfile.next()
-+				aligned_read = next(self.samfile)
- 				if aligned_read.is_qcfail:continue			#skip low quanlity					
- 				if aligned_read.is_duplicate:continue		#skip duplicate read
- 				if aligned_read.is_secondary:continue		#skip non primary hit
-@@ -3812,14 +3812,14 @@ class ParseBAM:
- 					for exn in exon_blocks:
- 						block_list.append(exn[0] + ":" + str(exn[1] + (exn[2]-exn[1])/2 ))
- 		except StopIteration:
--			print >>sys.stderr, "Done"
-+			print("Done", file=sys.stderr)
- 		
- 		
--		print >>sys.stderr, "shuffling alignments ...",
-+		print("shuffling alignments ...", end=' ', file=sys.stderr)
- 		random.shuffle(block_list_plus)
- 		random.shuffle(block_list_minus)
- 		random.shuffle(block_list)
--		print >>sys.stderr, "Done"
-+		print("Done", file=sys.stderr)
- 		
- 		
- 		ranges_plus={}
-@@ -3830,7 +3830,7 @@ class ParseBAM:
- 		rawCount_table=collections.defaultdict(list)
- 		RPKM_head=['#chr','start','end','name','score','strand']
- 
--		tmp=range(sample_start,sample_end,sample_step)
-+		tmp=list(range(sample_start,sample_end,sample_step))
- 		tmp.append(100)
- 		#=========================sampling uniquely mapped reads from population
- 		for pertl in tmp:	#[5, 10, 15, 20, 25, 30, 35, 40, 45, 50, 55, 60, 65, 70, 75, 80, 85, 90, 95,100]
-@@ -3841,27 +3841,27 @@ class ParseBAM:
- 			RPKM_head.append(str(pertl) + '%')
- 			
- 			if strand_rule is not None:
--				print >>sys.stderr, "sampling " + str(pertl) +"% (" + str(int(cUR_plus * percent_end)) + ") forward strand fragments ..."
-+				print("sampling " + str(pertl) +"% (" + str(int(cUR_plus * percent_end)) + ") forward strand fragments ...", file=sys.stderr)
- 				for i in block_list_plus[int(cUR_plus*percent_st):int(cUR_plus*percent_end)]:
- 					(chr,coord) = i.split(':')
- 					if chr not in ranges_plus:ranges_plus[chr] = Intersecter()
- 					else:ranges_plus[chr].add_interval( Interval( int(coord), int(coord)+1 ) )								
- 				
--				print >>sys.stderr, "sampling " + str(pertl) +"% (" + str(int(cUR_minus * percent_end)) + ") reverse strand fragments ..."			
-+				print("sampling " + str(pertl) +"% (" + str(int(cUR_minus * percent_end)) + ") reverse strand fragments ...", file=sys.stderr)			
- 				for i in block_list_minus[int(cUR_minus*percent_st):int(cUR_minus*percent_end)]:
- 					(chr,coord) = i.split(':')
- 					if chr not in ranges_minus:ranges_minus[chr] = Intersecter()				
- 					else:ranges_minus[chr].add_interval( Interval( int(coord), int(coord)+1 ) )						
- 			
- 			else:
--				print >>sys.stderr, "sampling " + str(pertl) +"% (" + str(int(sample_size)) + ") fragments ..."
-+				print("sampling " + str(pertl) +"% (" + str(int(sample_size)) + ") fragments ...", file=sys.stderr)
- 				for i in block_list[int(cUR_num*percent_st):int(cUR_num*percent_end)]:
- 					(chr,coord) = i.split(':')
- 					if chr not in ranges:ranges[chr] = Intersecter()						
- 					else:ranges[chr].add_interval( Interval( int(coord), int(coord)+1 ) )														
- 
- 			#========================= calculating RPKM based on sub-population
--			print >>sys.stderr, "assign reads to transcripts in " + refbed + ' ...'
-+			print("assign reads to transcripts in " + refbed + ' ...', file=sys.stderr)
- 			for line in open(refbed,'r'):
- 				try:
- 					if line.startswith(('#','track','browser')):continue  
-@@ -3872,14 +3872,14 @@ class ParseBAM:
- 					tx_end    = int( fields[2] )
- 					geneName      = fields[3]
- 					strand    = fields[5]
--					exon_starts = map( int, fields[11].rstrip( ',\n' ).split( ',' ) )
--					exon_starts = map((lambda x: x + tx_start ), exon_starts)
--					exon_ends = map( int, fields[10].rstrip( ',\n' ).split( ',' ) )
--					exon_ends = map((lambda x, y: x + y ), exon_starts, exon_ends)
--					exon_sizes = map(int,fields[10].rstrip(',\n').split(','))
-+					exon_starts = list(map( int, fields[11].rstrip( ',\n' ).split( ',' ) ))
-+					exon_starts = list(map((lambda x: x + tx_start ), exon_starts))
-+					exon_ends = list(map( int, fields[10].rstrip( ',\n' ).split( ',' ) ))
-+					exon_ends = list(map((lambda x, y: x + y ), exon_starts, exon_ends))
-+					exon_sizes = list(map(int,fields[10].rstrip(',\n').split(',')))
- 					key='\t'.join((chrom.lower(),str(tx_start),str(tx_end),geneName,'0',strand))
- 				except:
--					print >>sys.stderr,"[NOTE:input bed must be 12-column] skipped this line: " + line
-+					print("[NOTE:input bed must be 12-column] skipped this line: " + line, file=sys.stderr)
- 					continue
- 				mRNA_count=0	#we need to initializ it to 0 for each gene
- 				mRNA_len=sum(exon_sizes)
-@@ -3892,24 +3892,24 @@ class ParseBAM:
- 						if chrom in ranges:
- 							mRNA_count += len(ranges[chrom].find(st,end))
- 				if mRNA_len ==0:
--					print >>sys.stderr, geneName + " has 0 nucleotides. Exit!"
-+					print(geneName + " has 0 nucleotides. Exit!", file=sys.stderr)
- 					sys.exit(1)
- 				if sample_size == 0:
--					print >>sys.stderr, "Too few reads to sample. Exit!"
-+					print("Too few reads to sample. Exit!", file=sys.stderr)
- 					sys.exit(1)
- 				mRNA_RPKM = (mRNA_count * 1000000000.0)/(mRNA_len * sample_size)
- 				RPKM_table[key].append(str(mRNA_RPKM))
- 				rawCount_table[key].append(str(mRNA_count))
--			print >>sys.stderr, ""
-+			print("", file=sys.stderr)
- 
- 		#self.f.seek(0)
--		print >>RPKM_OUT, '\t'.join(RPKM_head)
--		print >>RAW_OUT, '\t'.join(RPKM_head)
-+		print('\t'.join(RPKM_head), file=RPKM_OUT)
-+		print('\t'.join(RPKM_head), file=RAW_OUT)
- 		for key in RPKM_table:
--			print >>RPKM_OUT, key + '\t',
--			print >>RPKM_OUT, '\t'.join(RPKM_table[key])
--			print >>RAW_OUT, key + '\t',
--			print >>RAW_OUT, '\t'.join(rawCount_table[key])		
-+			print(key + '\t', end=' ', file=RPKM_OUT)
-+			print('\t'.join(RPKM_table[key]), file=RPKM_OUT)
-+			print(key + '\t', end=' ', file=RAW_OUT)
-+			print('\t'.join(rawCount_table[key]), file=RAW_OUT)		
- 		
- 	def fetchAlignments(self,chr,st,end):
- 		'''fetch alignment from sorted BAM file based on chr, st, end
-@@ -3927,4 +3927,4 @@ def print_bits_as_bed( bits ):
- 		start = bits.next_set( end )
- 		if start == bits.size: break
- 		end = bits.next_clear( start )
--		print "%d\t%d" % ( start, end )
-+		print("%d\t%d" % ( start, end ))
diff --git a/biology/py-crossmap/files/patch-lib_cmmodule_twoList.py b/biology/py-crossmap/files/patch-lib_cmmodule_twoList.py
deleted file mode 100644
index efbb0c474374..000000000000
--- a/biology/py-crossmap/files/patch-lib_cmmodule_twoList.py
+++ /dev/null
@@ -1,18 +0,0 @@
---- lib/cmmodule/twoList.py.orig	2021-04-04 22:42:53 UTC
-+++ lib/cmmodule/twoList.py
-@@ -5,7 +5,7 @@ from operator import mul,add,sub
- def check_list(v1,v2):
- 	'''check if the length of two list is same'''
- 	if v1.size != v2.size:
--		raise ValueError,"the lenght of both arrays must be the same"
-+		raise ValueError("the length of both arrays must be the same")
- 	pass
- 
- def Add(v1,v2):
-@@ -50,4 +50,4 @@ def Min(v1,v2):
- def euclidean_distance(v1,v2):
- 	'''return euclidean distance'''                                                                                 
- 	check_list(v1,v2)
--	return (sum((v1.__sub__(v2))**2) / v1.size)**0.5
-\ No newline at end of file
-+	return (sum((v1.__sub__(v2))**2) / v1.size)**0.5
diff --git a/biology/py-crossmap/files/patch-setup.py b/biology/py-crossmap/files/patch-setup.py
deleted file mode 100644
index 4fa46ca7cc20..000000000000
--- a/biology/py-crossmap/files/patch-setup.py
+++ /dev/null
@@ -1,10 +0,0 @@
---- setup.py.orig	2021-04-05 15:27:07 UTC
-+++ setup.py
-@@ -11,7 +11,6 @@ def main():
-     setup(  name = "CrossMap",
-             version = "0.5.2",
-             python_requires='>=3.5',
--            py_modules = [ 'psyco_full' ],
-             packages = find_packages( 'lib' ),
-             package_dir = { '': 'lib' },
-             package_data = { '': ['*.ps'] },