酵母同義與非同義 SNP 的判定程式

gaorongchao1990626發表於2013-09-02

use strict;
use warnings;

# File-level variables declared up front for the chromosome-loading section
# further down in this script.
my $filename;
my @filename;
my $i;

# Codon table: maps each of the 64 DNA codons (upper-case A/C/G/T) to a
# one-letter amino-acid code; the three stop codons map to '_'.
# The table is written grouped by amino acid and then expanded into one
# hash entry per codon.
my %genetic_code;
{
    my @codons_for = (
        'S' => [qw(TCA TCC TCG TCT AGC AGT)],        # Serine
        'F' => [qw(TTC TTT)],                        # Phenylalanine
        'L' => [qw(TTA TTG CTA CTC CTG CTT)],        # Leucine
        'Y' => [qw(TAC TAT)],                        # Tyrosine
        '_' => [qw(TAA TAG TGA)],                    # Stop
        'C' => [qw(TGC TGT)],                        # Cysteine
        'W' => [qw(TGG)],                            # Tryptophan
        'P' => [qw(CCA CCC CCG CCT)],                # Proline
        'H' => [qw(CAC CAT)],                        # Histidine
        'Q' => [qw(CAA CAG)],                        # Glutamine
        'R' => [qw(CGA CGC CGG CGT AGA AGG)],        # Arginine
        'I' => [qw(ATA ATC ATT)],                    # Isoleucine
        'M' => [qw(ATG)],                            # Methionine
        'T' => [qw(ACA ACC ACG ACT)],                # Threonine
        'N' => [qw(AAC AAT)],                        # Asparagine
        'K' => [qw(AAA AAG)],                        # Lysine
        'V' => [qw(GTA GTC GTG GTT)],                # Valine
        'A' => [qw(GCA GCC GCG GCT)],                # Alanine
        'D' => [qw(GAC GAT)],                        # Aspartic Acid
        'E' => [qw(GAA GAG)],                        # Glutamic Acid
        'G' => [qw(GGA GGC GGG GGT)],                # Glycine
    );

    # Consume the list two items at a time: amino-acid letter, codon list.
    while (@codons_for) {
        my ($amino_acid, $codons) = splice(@codons_for, 0, 2);
        $genetic_code{$_} = $amino_acid for @{$codons};
    }
}


# File-level working variables for the rest of the script.  All of them are
# kept declared here so that every later reference compiles under
# "use strict".
my $jianji_number=0;
my %hash;            # $hash{chromosome}{position} = base; positions start at 1
my $DNA;
my @DNA;
my $jianji;
my $first;
my $second;
my $base;
my @information;
my $key1;
my $key2;
my $key3;
my $rever_first;
my $rever_second;
my $yushu;
my $position;

# Build one position => base lookup per chromosome.
#
# Each chromosome is read from a file named "chr<name>" in the current
# directory.  The first line of the file is read and discarded (presumably
# a FASTA header line -- confirm against the input files); all whitespace is
# stripped from the remaining lines and every character of the result is
# stored under its 1-based position.
#
# Dies with the file name and the system error if a file cannot be opened
# or closed.
@filename=qw/I II III IV V VI VII VIII IX X XI XII XIII XIV XV XVI/;
for my $chromosome (@filename)
{
	my $path="chr$chromosome";
	open(my $chr_fh,'<',$path) or die("can not open $path: $!");
	my $header=<$chr_fh>;                  # first line is skipped on purpose
	my $sequence=join('',<$chr_fh>);
	close($chr_fh) or die("can not close $path: $!");
	$sequence=~s/\s//g;

	# substr() offsets start at 0, stored positions start at 1.
	for my $offset (0 .. length($sequence)-1)
	{
		$hash{$chromosome}{$offset+1}=substr($sequence,$offset,1);
	}
}


# Classify every SNP listed in information_of_tongyi_or_not.txt as
# synonymous ("TY") or non-synonymous ("FTY") and write one line per
# classified SNP to TY_and_FTY.txt.
#
# Input: whitespace-separated columns, numbered from 0.
#   0  chromosome name (key into %hash)
#   1  SNP position (same 1-based coordinates as %hash)
#   2  first allele, 3 second allele (presumably reference and variant,
#      given as bases of the sequence stored in %hash -- confirm)
#   4  coordinate where a '+' gene must show A,T,G at [4],[4]+1,[4]+2
#   5  coordinate where a '-' gene must show T,A,C at [5],[5]-1,[5]-2
#   7  index (0, 1 or 2) of the SNP inside its codon; used for '+' genes only
#   8  strand, "+" or "-"
#
# Output line: columns 0..8 of the input, the amino acid encoded with the
# first allele, the amino acid encoded with the second allele, and the label.
#
# A SNP is skipped (nothing written) when the line has fewer than nine
# columns, the strand is neither "+" nor "-", the start-codon check fails,
# the codon index of a '+' gene is not 0/1/2, or either codon cannot be
# translated.  The last case is reported on STDERR, because comparing two
# missing translations would otherwise count the SNP as synonymous.
my $snp_table='information_of_tongyi_or_not.txt';
my $result_file='TY_and_FTY.txt';

open(my $out_fh,'>',$result_file) or die("can not open $result_file: $!");
open(my $in_fh,'<',$snp_table) or die("can not open $snp_table: $!");

SNP:
while(my $line=<$in_fh>)
{
	chomp $line;
	my @fields=split ' ',$line;          # ' ' also ignores leading blanks
	next SNP if @fields<9;

	my ($chr,$snp_pos,$allele_a,$allele_b,$gene_start,$gene_end)=@fields[0..5];
	my $phase=$fields[7];
	my $strand=$fields[8];
	next SNP unless $strand eq '+' || $strand eq '-';
	next SNP unless exists $hash{$chr};  # chromosome was never loaded
	my $bases=$hash{$chr};
	my $is_minus=($strand eq '-');

	# Start-codon check.  For a '-' gene the three bases are read downwards
	# from column 5 and must be T,A,C, i.e. the complement of A,T,G.
	my @start_at=$is_minus
		? ($gene_end,$gene_end-1,$gene_end-2)
		: ($gene_start,$gene_start+1,$gene_start+2);
	my $start_codon=join('',map { defined $bases->{$_} ? $bases->{$_} : '?' } @start_at);
	next SNP unless $start_codon eq ($is_minus ? 'TAC' : 'ATG');

	# Index of the SNP inside its codon, counted in reading direction.
	my $slot;
	if($is_minus)
	{
		# Remainder 1 -> first base, 2 -> second base, 0 -> third base.
		my $remainder=($gene_end+1-$snp_pos)%3;
		$slot=($remainder+2)%3;
	}
	else
	{
		($slot)=grep { $phase==$_ } 0..2;
		next SNP unless defined $slot;
	}

	# Collect the codon in reading order: ascending positions for '+',
	# descending positions for '-'.  The SNP slot takes the two alleles,
	# the other two slots take the stored bases.
	my $step=$is_minus ? -1 : 1;
	my (@codon_a,@codon_b);
	for my $k (0..2)
	{
		if($k==$slot)
		{
			push @codon_a,$allele_a;
			push @codon_b,$allele_b;
			next;
		}
		my $neighbour=$bases->{$snp_pos+$step*($k-$slot)};
		unless(defined $neighbour)
		{
			warn "skipping SNP on $chr at $snp_pos: codon runs past the loaded sequence\n";
			next SNP;
		}
		push @codon_a,$neighbour;
		push @codon_b,$neighbour;
	}
	my $codon_a=join('',@codon_a);
	my $codon_b=join('',@codon_b);

	if($is_minus)
	{
		# revcom() in this script returns the base-by-base complement
		# WITHOUT reversing the string, which is why the bases were
		# collected in descending position order above.
		$codon_a=revcom($codon_a);
		$codon_b=revcom($codon_b);
	}

	my ($aa_a,$aa_b)=@genetic_code{$codon_a,$codon_b};
	unless(defined $aa_a && defined $aa_b)
	{
		warn "skipping SNP on $chr at $snp_pos: cannot translate $codon_a / $codon_b\n";
		next SNP;
	}

	# Every synonymous change gets the same label, whatever its codon index.
	my $label=($aa_a eq $aa_b) ? 'TY' : 'FTY';
	print {$out_fh} "@fields[0..8] $aa_a $aa_b $label\n";
}

close($in_fh);
close($out_fh) or die("can not close $result_file: $!");



# Subroutine: return the complement of a DNA string.
#
# Despite its name this routine does NOT reverse its argument, and it never
# has: the earlier body wrote "my ($revcom) = reverse($dna)", a list
# assignment, so reverse() flipped a one-element list and left the string
# untouched.  The minus-strand code in this script builds each codon already
# in reading order and relies on getting back a plain complement, so that
# contract is kept and only the no-op reverse() call is gone.
#
# Parameter: $dna - string of bases; A/C/G/T in either case are mapped,
#                   every other character is passed through unchanged.
# Returns:   the complemented string, same length and order as the input.
#
# The routine writes nothing to STDOUT, so the script's standard output is
# not flooded with one line per translated codon.
sub revcom
{
    my ($dna) = @_;
    (my $complement = $dna) =~ tr/ACGTacgt/TGCAtgca/;
    return $complement;
}

物件、同義詞和公有同義詞順序選取
2011-02-22
物件
中考常見同義詞和同義短語總結
2024-05-03
【Oracle】-【同義詞】-public與非public同義詞
2013-07-26
Oracle
Oracle中的同義詞SYNONYM
2015-04-29
Oracle
匯出Oracle中的同義詞
2017-02-19
Oracle
SYS查詢不到的同義詞
2010-02-20
Spring 非同步任務的建立、自定義配置和原理
2019-02-14
Spring非同步
深入掌握 ECMAScript 6 非同步程式設計（二）：Thunk 函式的含義和用法
2015-10-14
非同步程式設計函式
程式的定義
2021-01-02
SMART原則的定義和含義
2024-10-13
在程式中定義多個同值不同名的變數
2024-04-20
變數
set unused column和檢視，約束，同義詞和索引的關係
2010-09-11
索引
授權與同義詞
2015-04-13
ORACLE公有/私有同義詞
2013-11-03
Oracle
詳解同義詞(synonym)
2012-02-08
【Oracle】v$表和v_$同義詞的訪問許可權
2011-09-25
Oracle訪問許可權
ASP.NET MVC下的非同步Action的定義和執行原理[轉]
2015-02-03
ASP.NETMVC非同步
以程式設計師的名義，分析 “人民的名義”
2017-05-09
程式設計師
匯出oracle公有同義詞
2021-01-15
Oracle
Oracle同義詞建立方法
2008-03-07
Oracle
多層巢狀同義詞
2009-08-27
巢狀
Oracle同義詞 kingsql作品
2013-03-15
OracleSQL
官檔同義詞學習
2013-01-28
好程式碼的定義
2014-04-22
方法的作用和定義
2024-07-31
併發程式設計：自定義併發類：自定義非同步流（釋出與訂閱）
2020-10-17
程式設計非同步
程式碼，貓和理想主義
2012-09-09
工廠模式建立物件和自定義建構函式建立物件的異同
2019-03-01
模式物件函式
寫論文如何同義轉換
2017-11-15
資料庫鏈與同義詞
2007-02-28
資料庫
Oracle同義詞建立方法(轉)
2007-08-16
Oracle
C++中&和*的含義
2020-02-15
C++
Git分支的定義和操作
2020-12-12
Git
變數的定義和使用
2020-11-22
變數
加密鹽的意義和用途
2017-11-26
加密
mysql 下的提示和含義
2015-04-13
MySql
深入掌握 ECMAScript 6 非同步程式設計（一）：Generator 函式的含義與用法
2015-10-14
非同步程式設計函式
深入掌握 ECMAScript 6 非同步程式設計（四）：async函式的含義與用法
2015-10-14
非同步程式設計函式

酵母同義與非同義 SNP 的判定程式

相關文章