Class: Bio::Sequence::AA
- Inherits:
-
Object
- Object
- Bio::Sequence::AA
- Defined in:
- lib/bio/sequence/aa/aa.rb
Instance Method Summary collapse
- #accepted_length ⇒ Object
-
#bs_group ⇒ Object
return the block sharing group.
- #c_terminal_motif ⇒ Object
-
#cys_count ⇒ Object
number of cysteines.
-
#cyspolv_group ⇒ Object
Assigning dsid group based on number of cysteines, presence of REY motif in polv2 and MFK in polv1,.
-
#dsid ⇒ Object
distict sequence identifier(DSID).
- #end_motif ⇒ Object
- #groupA_status ⇒ Object
- #has_accepted_length? ⇒ Boolean
-
#is_groupA_like? ⇒ Boolean
return var group A like tags.
- #is_var1? ⇒ Boolean
- #is_var1_cp1? ⇒ Boolean
- #is_var1_cp2? ⇒ Boolean
- #n_terminal_motif ⇒ Object
-
#polv1 ⇒ Object
The first position of limited variability(polv1).
- #polv1_pos ⇒ Object
-
#polv1_to_polv2 ⇒ Object
get the 5’ end of the sequence from the ‘middle’.
-
#polv2 ⇒ Object
The second position of limited variability(polv2).
- #polv2_pos ⇒ Object
-
#polv3 ⇒ Object
The third position of limited variability(polv3).
- #polv3_pos ⇒ Object
-
#polv3_to_polv4 ⇒ Object
get the 3’end of the sequence from the “middle”.
-
#polv4 ⇒ Object
The fourth position of limited variability(polv4).
- #polv4_pos ⇒ Object
-
#pspb1(anchor_pos = 0, win_len = 14) ⇒ Object
position specific polymorphic block 1.
-
#pspb2(anchor_pos = 0, win_len = 14) ⇒ Object
position specific polymorphic block 2.
-
#pspb3(anchor_pos = 0, win_len = 14) ⇒ Object
position specific polymorphic block 3.
-
#pspb4(anchor_pos = 0, win_len = 14) ⇒ Object
position specific polymorphic block 4.
- #sig2_like? ⇒ Boolean
- #sig2_status ⇒ Object
- #start_motif ⇒ Object
- #var1_status ⇒ Object
- #vw_missing? ⇒ Boolean
- #vw_pos ⇒ Object
- #vw_ww_missing? ⇒ Boolean
- #ww_missing? ⇒ Boolean
- #ww_pos ⇒ Object
Instance Method Details
#accepted_length ⇒ Object
202 203 204 |
# File 'lib/bio/sequence/aa/aa.rb', line 202 def accepted_length 100..168 end |
#bs_group ⇒ Object
return the block sharing group
117 118 119 120 121 122 123 124 125 126 127 |
# File 'lib/bio/sequence/aa/aa.rb', line 117 def bs_group case when self =~ /(?:R(?:HYADHDKSGNYYK|NENNNLGKLSNEQ|I(?:RHYDDGSGNY(?:SK|YK)|THYN(?:GVSGNCVK|DGSGNYVK))|E(?:RYKDLKDVEIDD|HYKEVKNGNY(?:YK|IK)|KYKDLKD(?:VEIDD|LPIDD))|VKETYKDDPNYYK|KNNSSLRKLTNEQ)|G(?:G(?:RGRK(?:KLEDNL(?:IE|KE)|QLEENLQK)|GGRKKLEDNLKE)|I(?:N(?:D(?:Y(?:ND(?:GSGNYFK|ISGNYYK)|D(?:RDGPE(?:HYK|YYK)|GDGPEYYK))|CDRDGPEYYK)|AYNDGSENYYK)|IDYDHDGPHYYK)|P(?:SQEK(?:IKLEENLK|KKLEENLK)|KQEKKELEENLK)|K(?:NYPDDGSGN(?:YYK|FYK)|K(?:YYND(?:G(?:SGNYYK|TGNYVK)|ETGNYYK)|KEKEKIYGNIE)|QYYNDENGNYYK)|QTYPDDGSGNYYK)|MESNANLKKHTLER|S(?:STNTQCRCATNDV|HY(?:TDTHGSIDYDK|ED(?:GDKSGNYYK|KDKSGNYIK)|ADHDKSGNY(?:YK|LK))|NKEKEKIENSLQN|DYKDDD(?:GSGNYYK|IDGNYY(?:K|Q))|E(?:GKCGHKETERDL|KVEYGLRKLFKK)|VQERYGNDPNFFQ|KI(?:NDYDGDPNYYK|TDYDNDPNYYK)|QGQCGRNENNGYP|F(?:S(?:SEYCGH(?:RQGS(?:V|A)|GDNEV|EQGNV)|N(?:GQCGHRDENV|SKCGHGEHEV|DYCGH(?:RQGSV|NENKV)|PKCGH(?:G(?:DNEV|EHEV)|NENKV|EQGNV)|EYCGHRQGSV)|D(?:RKCGHYEGAP|HKCGH(?:GDKDV|YEGAP|DENAP)))|TN(?:GQCGHNEENV|PKCG(?:RGDNEV|H(?:G(?:DNEV|EHEV)|DENKV)))|ADAYCGRGDENV)|LILPYSKCGRDTD)|H(?:HYKDDDISGNYSK|SKEKEKLQTNLKN|N(?:H(?:IKKPLLENLEQ|KKKPLL(?:DNLEK|ENLEQ))|NKKKALLDNLEK|QKKINLEKSLHR)|EQG(?:YNKLEAI(?:SKT|LKT)|NNKLEA(?:RLKT|ILKT))|QQRK(?:RKLEENLRN|GKLEENLRN))|C(?:RAP(?:N(?:GANYFRKGL|EANYFKNVA)|KNAHYFIKSS|QKANYFKNVA)|G(?:TGENDTYFKNSS|A(?:G(?:EKDTYF(?:TYS(?:N|K)|VQLD)|A(?:RDEYFIKPS|KDTYFTYSK))|TMNDIFSKNIG|LPKSAY(?:VLQSE|F(?:MQLE|LQSE))))|S(?:VPYEAYYFTYKS|A(?:G(?:PKDTYFIKSG|QKDTYFIKPN)|D(?:GSE(?:DYFIKSS|EYF(?:IQSE|KKQS))|DSEDYFI(?:RSE|QSE))|P(?:RDA(?:DYFIKNS|QYFIKSS)|GD(?:VNYFRK(?:GL|IS|ES|FS)|AKYVK(?:YFP|NFP))|HNAQYVKYVP|Y(?:GANYYRKYS|HPGYFRQSK|YADYF(?:RKGS|K(?:SVA|KK(?:S|P)))|NAHYFIKSS|CADYFKKKS|DANYVRRKS|EA(?:YYFTYKS|QYFIKSS)|KSQYFIKSS)|D(?:YAKYFRQTC|NAKY(?:VKYFP|FKPPK)))|QNNEVYFINSE))|Y(?:IPY(?:YVNYFK(?:NIS|DIS|K(?:T(?:S|P)|KS))|CVNYFKNIS)|APNNANYFIGSG)|NAP(?:GD(?:VHYFRKDP|AHYFRKDP)|Y(?:DANY(?:YR(?:KYS|QTC)|VRRKS|FRKTS)|EAQY(?:YIKSS|FIK(?:SS|PS))|K(?:SRYF(?:M(?:HSE|QSE)|IQSE)|A(?:QYYIKSS|WYFMHSE)))|NISGYFMQS(?:G|E)|D(?:NVNYFRKYS|KAEYFVYKS))|TAP(?:YGANYYRKYS|D(?:NVNYFRKYS|KANYFIYKS))|IAPRDAHYFLKSS|D(?:TEESDTYFKQSS|A(?:SYKSGYFMQSE|P(?:RDA(?:HYFLKSS|NFFIKNS|DYF(?:RKGS|KNVA))|YKSRYF(?:MQSE|IQSE)|KDANYFIGSG|QKVDYFRK(?:GS|IS))))|EA(?:SKNANFFIK(?:NS|DS)|P(?:GDAHYFRKGP|ENAYIIKRRI|KDANYFIGSG|QKVDYFRKG(?:S|L)))|VA(?:GEGNTYFIQLD|PENAYFRKTEA)|KA(?:S(?:RNA(?:HYFLKSS|NYFRK(?:IS|AL))|KNANFFIKNS)|P(?:GDVN(?:YFRKIS|FFIKNS)|NGANYFRKKS|TGA(?:HYFLKSS|DYF(?:VYKP|KKKS))|PKVDYSRNIS|EDADYFRKGS|K(?:GANYFRKES|DA(?:HYFLKSS|N(?:YFIGSG|FFIKIS)|DYFRKGS))|Q(?:GANYFRNIS|SVHYFIKTS|DANYF(?:R(?:N(?:IS|VS)|K(?:GL|IS))|TKES)|K(?:VDYFRKGS|ANYFRKGS)))|KEGDIYSKTTD)|FA(?:HNTEEYFIKSE|DGSEEYFI(?:KSS|QS(?:S|E)))|AAR(?:GNDLYSKNIG|YHPGYFKKSD))|Y(?:NERDR(?:DKKRKLQE|EKKRKLQD|AQKKKLQD)|DEKEKNRRKQLEN|KAP(?:RKA(?:NYFIYKS|DYFRNIS)|KDAHYFLKSS|QDANYFRNVS))|N(?:RKEKGKLQTNLKN|GDYK(?:EKVSNNL(?:RA|KT)|KKVSNNLKT)|HYKDD(?:NGS(?:GNYYK|ENYYK)|D(?:GSGNYYK|ISGNY(?:SK|YK)))|SDDKVE(?:NGLKKVF|KGLREVF)|Y(?:Y(?:NNTGNN(?:V(?:NYAK|DYVK)|ANYAK)|ADGDKSGNYYK)|NYDEDGSGNY(?:YK|VK))|N(?:HDNVE(?:NGL(?:REVF|KAVF)|KGLK(?:KVF|AVF))|D(?:ND(?:RVKKEKLQN|K(?:IKK(?:GKLRG|EKL(?:RG|QE))|VKKEKL(?:RG|QN)))|DDKIKKGKLRG|V(?:EKGL(?:DVVFKK|KVVFKK)|VKGLDVVFKK))|E(?:SE(?:IKRKEKLRG|KKKREELQG)|TDKEQKVKLEK|KDM(?:REKQKLQS|TEKQKLQS))|VDAVQEGLKVVF|KE(?:NEKLQENLKR|KEKIEKSLQN))|TVDK(?:IHEGLKVVF|VHEGLKVVF)|D(?:NVE(?:NGLREVFKK|KGLK(?:KVFDK|AVFRK))|DVEKGLKIVFEK|EDDVEKGLKIVF|K(?:D(?:YVENGLKKVF|A(?:V(?:RHGLKVVF|QKGLRAVF)|AQKVLRTVF))|EKDQRKKLDE(?:N|I)|VE(?:NGL(?:REVFKK|KKVFDK)|KGL(?:REVF(?:RK|KK)|QVVFGK)))|QD(?:DVEKGLKIVF|EVWNGLRSVF)|ADKV(?:EKGLQVVF|QKGLQVVF))|P(?:E(?:DKVHEGLKVVF|VE(?:NGLREVFNK|KGLKAVFRK))|QDKVQ(?:EGLK(?:NVF|VVF)|KGLREVF))|E(?:MVEIGLKKVFKK|HYKEVKNGNYVK|NVEKGL(?:K(?:IVFEK|KVFDK)|QVVFGK)|D(?:DKVQKGLQVVF|VEKGLKVVF(?:KK|QK))|EDAVQKGL(?:RAVF|K(?:VVF|KVF))|K(?:DAVQNGLKKVF|VE(?:YGLRKLFKK|IGLKKVF(?:DK|EK|KK)))|QDEVWKGLRDVF)|VH(?:YK(?:DDGS(?:GNYYK|ENYYK)|EVKNGNYVK)|DKVE(?:RGLREVF|TGLREVF|KGL(?:REVF|QVV(?:F|L))))|K(?:HDNIEKGLREVF|N(?:NVPL(?:HNLSLDK|DKLSLDK)|K(?:SPLDKLSLEQ|PPLDKLSVDK)|VEIGLK(?:NVFKN|KVFDK))|DDK(?:IEKSLRAIF|V(?:EKGLRAIF|QKGL(?:RAVF|KAVF|QVVF)))|Q(?:RKKILQEKLEN|EKEKREKLDEN))|FSNPKCGH(?:DEGIV|KQGNV)|QEDKVQEGLKVVF|LILTHPKCGHDTD)|I(?:SYYNADEKGNFYK|HNYDDNGSGNYYK|E(?:TRY(?:GSDTTNYYQ|ENDGPNYYQ)|ARYKKDDDNYYQ)|VSFDQCGHND(?:MDV|VDV)|KNDKTLNNLSNGQ|FSNEHCGHKQGSV)|T(?:SEGQCGHNDKMRP|HYADEDGS(?:GNYVK|ENYYK)|D(?:N(?:D(?:EVW(?:TGLRSVF|KGL(?:RSVF|GSVF))|AVQKGLRAVF)|VE(?:NGLREVFKK|KGLRAVFGK))|K(?:D(?:YVENGLK(?:KVF|AVF)|DVENGLREVF|EV(?:KEGLKVVF|WKGLRAVF)|AVQKGLRAVF)|VENGLK(?:EVFDK|KVFD(?:N|K))))|E(?:GYCGRNENNGYP|TLYKDEEGNYLK|KDDVEKGLKIVF)|V(?:S(?:SNKCGHNDMDV|NAKRREGDENP|FDQCGHNDM(?:HV|DV))|K(?:GTYKDDPYYYK|ETYKDDPNYYK))|F(?:S(?:GYWCGHYEGAP|NDYCGHGEHEV)|TYTKCGHDENKV))|D(?:SRTDKLEENLRKI|NNSDKLRDLSVDK|DDVEKGLKIVFEK|K(?:GEKKKLEKNLKD|NRGKLGALSLDD))|P(?:SY(?:IKCGHNNKDDP|LKCGHNNKDDP)|HYTNDRGLADYVK)|E(?:HY(?:EDVDGSGNYLK|KDVDGSGNYYK)|YY(?:NDTNNKINYVK|EDKDPDKNYYQ)|KNY(?:YNDGTGNYYK|PDDGSGNYSK)|FT(?:GGYCGRDETDV|SGYCGRNETNV))|V(?:NGNDKLESNLKKI|KAHY(?:KKDAPYYYK|QKDAPNYYK)|FSNRQCGHYED(?:VP|AP))|K(?:RYYNDDTD(?:NN(?:FYQ|LYQ)|DNFYQ)|GINDYDGDPNYYK|SYY(?:NAD(?:GEGNFYK|EKGNYYK)|DADEKGNYYK)|HY(?:TDTHGSIDYDK|A(?:H(?:GDGSGNY(?:SK|YK|LK)|DDGS(?:GNYYK|VNYYK))|DEDGSGNYYK))|YYNDTNNKINYVK|N(?:Y(?:YNPD(?:G(?:SGNYYK|AGNYYK)|EAGNYYK)|NYD(?:EDGPEYYK|KDGPEYYK))|NDRTLNNLSIGQ|DYNPDGSGNY(?:YK|FK)|E(?:SE(?:IKRKEKLQR|K(?:RTKEKLQG|NTKKKLQG))|NTDLNKLTTEK)|KNTKLSTLTLEK|AYPDDG(?:SGNY(?:YK|FK)|FGNYYK))|T(?:SN(?:SN(?:MDTLSLEQ|LKELSLDK)|TNMNTLSLDK)|IYADLKDVEIDD)|I(?:NDYDGDGPEYYK|THYDDISGNYYK|KDYDGDGPEYYK)|D(?:HY(?:KDEKDGNFFQ|QDDGTGNYYK)|YYNADEKGNYYK)|PHYKDDGFGNYYK|E(?:YYQDDGTGNYYK|ISDYDNDPNYYK|EYGDLKDVPIDD|KYGDLKDVPIDD)|V(?:HYKENKDGNY(?:YK|VK)|KY(?:PDL(?:ND(?:IEIDD|VEIDD)|KDLQIDD)|QDLKDVEIDD))|K(?:HY(?:ENDTDKNYYQ|KKDEDPNYYK)|VYPEDVTGNY(?:YK|FK)|KKKGLSELSTEK)|FS(?:SDRCGHNEGDP|ERKCGH(?:NEGSP|DENAP))|Q(?:HYK(?:DDGSVNYYK|EDKDENYYK)|NNKKLKDLTDKH)|A(?:RYKDRKDPNYYK|K(?:YEDLKTLPIDD|ERYKDIKNYYQ)))|F(?:S(?:S(?:SGPCGRDEAPV|HGKCGHNEGAP|DRCGHNNNDGP|E(?:GKCGHKEGTV|YCGHYKNGDP)|QGQCGHTEGTV)|N(?:RGPCGRNETDV|S(?:G(?:TRGRKELTV|PCGRKELTV|KCGGKEAPV)|KCGHHNNDGP)|N(?:GPCGRNETDV|KCGHSNGGDP)|PKCGHSNGGDP|E(?:HCGH(?:HNNDDP|YKNGDP)|YCGH(?:YKNGDP|KKNEDP)))|DNG(?:HCGRNETNV|PCGRKELIV))|T(?:RQGYCGHSETNV|GGGQC(?:RRNDNSV|GRNETDV)|S(?:HGKCG(?:RNETNV|HSEGAP)|IGKCGHNKGSV|EG(?:RCGHSETNV|KCG(?:RNETNV|HNDNRV)|Q(?:RGHSETNV|C(?:RRNDNSV|GH(?:SETNV|NDKSV|DENKV))))|VGYCGHNKG(?:SV|IR)|QG(?:YCG(?:RKE(?:LTV|APV)|HSETNV)|QCG(?:RNERNV|H(?:SETNV|TEGTV|KEGTV)))|AGKCR(?:RNDNSV|HNDNSV))|NDGKCG(?:RYEGAP|H(?:YE(?:GAP|NNI|D(?:NV|AP))|TEGTV))|TEGYCGR(?:NEGAP|DEGAP)|D(?:GHCGRTQEGHV|IGKCG(?:GKEAPV|H(?:GDKDV|N(?:EGAP|KGSV)|KQGNV))|DGKCGHYEGAP))|ENAGKC(?:RRNDNKV|GHNDNRV)|WDRKCGHSN(?:GGDP|EGA(?:P|L))|LYPKCGHNNKNDL)|Q(?:GIIDYDNDPNYYK|NYY(?:KDDPKKNYYK|ADDGSGNY(?:SK|VK))|ISDY(?:TGDHPNYYK|DGDGPEYYK)|K(?:SDSSLQRLSIEK|HYEDDGSGNYYK|NNSALKKLTDKQ|IY(?:EDINNLPIDD|KDLNNLPIDD))|QNNNTLENLTDKQ)|L(?:K(?:TRYKKDDDNYYQ|KHYQKDAPNYYK)|F(?:S(?:N(?:RQCGH(?:GEHEV|NEGAP|DENKV|EQGNV)|SKCGH(?:RQGNV|DE(?:SKV|NKV)|EQGNV)|YKCGHYEDAP|DYCGHKQGNV|PKCGH(?:EQG(?:NV|TV)|KQGKV)|AYCGHYEGSP)|D(?:GHCGNKDGTV|HKCGHEESRV|YKCGHYE(?:GSP|DAP)))|DYNCGHHKDNNV|WDRKCGHDERNV)|Q(?:TRYTNDGDNYFK|ERYNDPKGDFFQ|ARYKKDGDDFFK)|WNDKCGHHVDKDV|LFSNYKCGHYEGS)|A(?:RYKKDEEDGNYY(?:K|Q)|VSSNKCGHNDMNV|KNDYTGDHPNYYK|LKHYKDDTKNYYQ))/ block_sharing = 1 when self =~ /(?:RE(?:PGKQHLEERLER|KGKSRLEARLKT)|G(?:G(?:HYKNCHCIGGDV|TYKNCRCASGNV)|P(?:NQEKKLLENKLK|DQEKKKLEENLR)|ANAIKAGDNVSIV)|S(?:FTNGQCGRDGENV|WYPKCGHHVKQDV|AKEHYQDTENYYK)|H(?:NRRKEKLETRLEE|E(?:PG(?:IQ(?:HLEKRLES|YLEKRLES)|KQHL(?:GERLEQ|EERLE(?:R|Q)))|QG(?:YNRLEARLKT|NNRLEARLKT|INRLEARLKT))|QQRKHLLEKRLET)|C(?:RAEEK(?:GTYFKNRE|D(?:TYFKNRE|IYSKTTD)|EIYSKTTD)|G(?:TEDKDTYFIKSG|VEENAKYFRESS|A(?:GMKDIYSKTMN|SEDAKYKVIGP|T(?:MNDIFSKNIR|VDDI(?:SSKNIR|FSKNIR))|P(?:SDAQYFRNTC|KEAKYFRKTA)))|HAPPDAQYTKKGP|NA(?:P(?:TGADYFVYKP|KDANYFEYNS)|WGNTYFRKTCS)|DAG(?:QKDTYFKQSS|AADEYFKKSG)|EA(?:GTSDKYFRKTA|KSDDKYNVIGP)|KA(?:NDDAEYFRKKD|P(?:DKANYF(?:EPPK|KPPK)|EEDHYFKPAQ)|EVDDIYSKTAN|K(?:EGDIYSKT(?:MN|AN)|KG(?:GIYSKTMN|DIYSKTMN))))|Y(?:SQKYKDEKSKLEE|NE(?:TDKVQKAILQQ|KDQEEKRKLQE))|N(?:YYEDNDTDKNYYQ|NNAAKLSELSTAQ|THESAQRKKLEEN|DEEKKKRDELEKN|KN(?:NPPLYKLSLEK|KSPLDKLSLDK))|T(?:RYKKDDEDGNFFQ|PTQGKCHCIDGT(?:N|V)|L(?:FDYKCGHDENAP|WNEKCGHGDYNL))|I(?:EHYKDDPEENFYE|KS(?:NYNDSEGNYFK|QYDDNEGNYFK)|LFDYKCAHDNDKV)|D(?:RKEKVKLEENLKN|KGEKKKLEENLKN|Q(?:ERK(?:HLLEKRLET|QHLEKRLET)|QEK(?:LYLENNLKK|AKLENNLKR))|AKKHYGDDENYYK)|P(?:NKCRCEDANADQV|CSVQKCTCINGDP)|E(?:SN(?:M(?:GQCRCFSGDP|VQCRCFSGDP)|KGQCRCFSGDP)|THGYCRCVNRVDV|F(?:SGGKCGHKDNNV|T(?:GGQCGRDGENV|DGHCGH(?:RQGNV|NEENV))))|VKDRYQNDGPDFFK|K(?:S(?:SYNDDGTGNYFK|YYKNDNDRNYFK)|N(?:HYNDTSKNYYK|NNN(?:ELNNLSLDK|KLSNLSTKE))|D(?:HYKGDEANNYFQ|NNTKLNDLSIQE)|K(?:TNPALKSFTNEE|KLEENLRNIFKN)|FSNPKCGHNEGSP)|F(?:SNDQCGHNN(?:RGDP|GGAP)|WYPKC(?:GHHV(?:RQDV|KQ(?:DV|EV))|SHHVKQDV))|Q(?:RNNIKLQ(?:NIPLHE|TLTLHQ)|N(?:NNTKLQNIPLHE|KNENLKSLSLDK)|KENGDINTLKPEE)|L(?:FYYKCGHYVYKDV|WN(?:Y(?:NCGHHVN(?:RDV|QDV)|KCGHHVNQDV)|DKCGHHVKQDV))|ARDHYNDTSGNYYQ)/ block_sharing = 2 else block_sharing = 0 end block_sharing end |
#c_terminal_motif ⇒ Object
21 22 23 |
# File 'lib/bio/sequence/aa/aa.rb', line 21 def c_terminal_motif self[-5,self.length] end |
#cys_count ⇒ Object
number of cysteines
34 35 36 |
# File 'lib/bio/sequence/aa/aa.rb', line 34 def cys_count scan(/C/).size end |
#cyspolv_group ⇒ Object
Assigning dsid group based on number of cysteines, presence of REY motif in polv2 and MFK in polv1,
81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 |
# File 'lib/bio/sequence/aa/aa.rb', line 81 def cyspolv_group case when cys_count > 4 || cys_count == 3 || cys_count < 2 group = 6 when cys_count == 4 && polv2 =~ /REY/i group = 5 when cys_count == 4 group = 4 when cys_count == 2 && polv1 =~ /MFK/i group = 1 when cys_count == 2 && polv2 =~ /REY/i group =2 else group = 3 end group end |
#dsid ⇒ Object
distict sequence identifier(DSID)
166 167 168 |
# File 'lib/bio/sequence/aa/aa.rb', line 166 def dsid "#{polv1}-#{polv2}-#{polv3}-#{cys_count.to_s}-#{polv4}-#{self.length}" end |
#end_motif ⇒ Object
12 13 14 15 |
# File 'lib/bio/sequence/aa/aa.rb', line 12 def end_motif #warn "[DEPRECATION] 'end_motif' is deprecated. Please use `c_terminal_motif` instead." c_terminal_motif end |
#groupA_status ⇒ Object
155 156 157 158 159 160 161 162 |
# File 'lib/bio/sequence/aa/aa.rb', line 155 def groupA_status if is_groupA_like? status = 'groupA_like' else status = 'other' end status end |
#has_accepted_length? ⇒ Boolean
3 4 5 |
# File 'lib/bio/sequence/aa/aa.rb', line 3 def has_accepted_length? true if accepted_length.include? self.length end |
#is_groupA_like? ⇒ Boolean
return var group A like tags. Group A like sequences are associated with disease severity.
151 152 153 |
# File 'lib/bio/sequence/aa/aa.rb', line 151 def is_groupA_like? return true if cys_count == 2 && bs_group == 1 end |
#is_var1? ⇒ Boolean
137 138 139 |
# File 'lib/bio/sequence/aa/aa.rb', line 137 def is_var1? return true if is_var1_cp1? || is_var1_cp2? end |
#is_var1_cp1? ⇒ Boolean
129 130 131 |
# File 'lib/bio/sequence/aa/aa.rb', line 129 def is_var1_cp1? return true if cyspolv_group == 1 && self =~ /NVHDKVEKGLREVF|NVHDKVETGLREVF/i end |
#is_var1_cp2? ⇒ Boolean
133 134 135 |
# File 'lib/bio/sequence/aa/aa.rb', line 133 def is_var1_cp2? return true if cyspolv_group == 2 && self =~ /APNKEKIKLEENLKK/i end |
#n_terminal_motif ⇒ Object
17 18 19 |
# File 'lib/bio/sequence/aa/aa.rb', line 17 def n_terminal_motif self[0,5] end |
#polv1 ⇒ Object
The first position of limited variability(polv1)
49 50 51 |
# File 'lib/bio/sequence/aa/aa.rb', line 49 def polv1 self[10,4] end |
#polv1_pos ⇒ Object
99 100 101 |
# File 'lib/bio/sequence/aa/aa.rb', line 99 def polv1_pos index(polv1) end |
#polv1_to_polv2 ⇒ Object
get the 5’ end of the sequence from the ‘middle’
39 40 41 |
# File 'lib/bio/sequence/aa/aa.rb', line 39 def polv1_to_polv2 slice(rindex(polv1),rindex(polv2) - 6) end |
#polv2 ⇒ Object
The second position of limited variability(polv2)
54 55 56 57 58 59 60 61 62 |
# File 'lib/bio/sequence/aa/aa.rb', line 54 def polv2 if !ww_missing? return self[ww_pos - 4,4] elsif !vw_missing? return self[vw_pos - 12,4] else return '....' end end |
#polv2_pos ⇒ Object
103 104 105 |
# File 'lib/bio/sequence/aa/aa.rb', line 103 def polv2_pos index(polv2) end |
#polv3 ⇒ Object
The third position of limited variability(polv3)
65 66 67 68 69 70 71 72 73 |
# File 'lib/bio/sequence/aa/aa.rb', line 65 def polv3 if !ww_missing? return self[ww_pos + 10,4] elsif !vw_missing? return self[vw_pos + 2,4] else return '....' end end |
#polv3_pos ⇒ Object
107 108 109 |
# File 'lib/bio/sequence/aa/aa.rb', line 107 def polv3_pos index(polv3) end |
#polv3_to_polv4 ⇒ Object
get the 3’end of the sequence from the “middle”
44 45 46 |
# File 'lib/bio/sequence/aa/aa.rb', line 44 def polv3_to_polv4 slice(rindex(polv3),(rindex(polv4) - rindex(polv3) + 4)) end |
#polv4 ⇒ Object
The fourth position of limited variability(polv4)
76 77 78 |
# File 'lib/bio/sequence/aa/aa.rb', line 76 def polv4 self[self.length - 12,4] end |
#polv4_pos ⇒ Object
111 112 113 |
# File 'lib/bio/sequence/aa/aa.rb', line 111 def polv4_pos index(polv4) end |
#pspb1(anchor_pos = 0, win_len = 14) ⇒ Object
position specific polymorphic block 1
171 172 173 |
# File 'lib/bio/sequence/aa/aa.rb', line 171 def pspb1(anchor_pos=0,win_len=14) self[14 + anchor_pos,win_len] end |
#pspb2(anchor_pos = 0, win_len = 14) ⇒ Object
position specific polymorphic block 2
176 177 178 179 180 181 182 183 184 |
# File 'lib/bio/sequence/aa/aa.rb', line 176 def pspb2(anchor_pos=0,win_len=14) if !ww_missing? return self[ww_pos - 4 - anchor_pos - win_len, win_len] elsif !vw_missing? return self[vw_pos - 12 - win_len - anchor_pos, win_len] else return '....' end end |
#pspb3(anchor_pos = 0, win_len = 14) ⇒ Object
position specific polymorphic block 3
187 188 189 190 191 192 193 194 195 |
# File 'lib/bio/sequence/aa/aa.rb', line 187 def pspb3(anchor_pos=0,win_len=14) if !ww_missing? return self[ww_pos + 14 + anchor_pos, win_len] elsif !vw_missing? return self[vw_pos + 6 + anchor_pos, win_len] else return '....' end end |
#pspb4(anchor_pos = 0, win_len = 14) ⇒ Object
position specific polymorphic block 4
198 199 200 |
# File 'lib/bio/sequence/aa/aa.rb', line 198 def pspb4(anchor_pos=0,win_len=14) self[self.length - 12 - win_len - anchor_pos, win_len] end |
#sig2_like? ⇒ Boolean
218 219 220 |
# File 'lib/bio/sequence/aa/aa.rb', line 218 def sig2_like? return true if self =~ /AKLSELSTAQ|CRAEEKDTYF|KCGHHVNQDV|HEPGKQHLEE|EPGKQHLEER|PGKQHLEERL|GKQHLEERLE|KQHLEERLEQ|QHLEERLEQM|HLEERLEQMF|LEERLEQMFE|EERLEQMFEN|ERLEQMFENI|RLEQMFENIK|LEQMFENIKN|EQMFENIKNN|QMFENIKNNN|MFENIKNNNA|FENIKNNNAA|ENIKNNNAAK|NIKNNNAAKL|IKNNNAAKLS|KNNNAAKLSE|NNNAAKLSEL|NNAAKLSELS|NAAKLSELST|AAKLSELSTA|RAEEKDTYFK|AEEKDTYFKN|EEKDTYFKNR|EKDTYFKNRE|KDTYFKNREN|DTYFKNRENG|TYFKNRENGK|YFKNRENGKL|FKNRENGKLL|KNRENGKLLL|NRENGKLLLW|RENGKLLLWN|ENGKLLLWNY|NGKLLLWNYK|GKLLLWNYKC|KLLLWNYKCG|LLLWNYKCGH|LLWNYKCGHH|LWNYKCGHHV|WNYKCGHHVN|NYKCGHHVNQ|YKCGHHVNQD|AKLSELSTAQ|CKAKEGDIYS|NCGHHVNQDV|HEPGKQHLEE|EPGKQHLEER|PGKQHLEERL|GKQHLEERLE|KQHLEERLEQ|QHLEERLEQM|HLEERLEQMF|LEERLEQMFE|EERLEQMFEN|ERLEQMFENI|RLEQMFENIK|LEQMFENIKN|EQMFENIKNN|QMFENIKNNN|MFENIKNNNA|FENIKNNNAA|ENIKNNNAAK|NIKNNNAAKL|IKNNNAAKLS|KNNNAAKLSE|NNNAAKLSEL|NNAAKLSELS|NAAKLSELST|AAKLSELSTA|KAKEGDIYSK|AKEGDIYSKT|KEGDIYSKTA|EGDIYSKTAN|GDIYSKTANG|DIYSKTANGN|IYSKTANGNT|YSKTANGNTT|SKTANGNTTL|KTANGNTTLW|TANGNTTLWN|ANGNTTLWNY|NGNTTLWNYN|GNTTLWNYNC|NTTLWNYNCG|TTLWNYNCGH|TLWNYNCGHH|LWNYNCGHHV|WNYNCGHHVN|NYNCGHHVNQ|YNCGHHVNQD|GDINTLKPEE|CRAEEKDIYS|NCGHHVNQDV|HEPGKQHLEE|EPGKQHLEER|PGKQHLEERL|GKQHLEERLE|KQHLEERLER|QHLEERLERI|HLEERLERIF|LEERLERIFA|EERLERIFAN|ERLERIFANI|RLERIFANIQ|LERIFANIQK|ERIFANIQKE|RIFANIQKEN|IFANIQKENG|FANIQKENGD|ANIQKENGDI|NIQKENGDIN|IQKENGDINT|QKENGDINTL|KENGDINTLK|ENGDINTLKP|NGDINTLKPE|RAEEKDIYSK|AEEKDIYSKT|EEKDIYSKTT|EKDIYSKTTD|KDIYSKTTDN|DIYSKTTDNG|IYSKTTDNGK|YSKTTDNGKL|SKTTDNGKLI|KTTDNGKLIL|TTDNGKLILW|TDNGKLILWN|DNGKLILWNY|NGKLILWNYN|GKLILWNYNC|KLILWNYNCG|LILWNYNCGH|ILWNYNCGHH|LWNYNCGHHV|WNYNCGHHVN|NYNCGHHVNQ|YNCGHHVNQD/ end |
#sig2_status ⇒ Object
222 223 224 225 226 227 228 229 |
# File 'lib/bio/sequence/aa/aa.rb', line 222 def sig2_status if sig2_like? sig2 = 'sig2_like' else sig2 = 'other' end sig2 end |
#start_motif ⇒ Object
7 8 9 10 |
# File 'lib/bio/sequence/aa/aa.rb', line 7 def start_motif #warn "[DEPRECATION] 'start_motif' is deprecated. Please use `n_terminal_motif` instead." n_terminal_motif end |
#var1_status ⇒ Object
141 142 143 144 145 146 147 148 |
# File 'lib/bio/sequence/aa/aa.rb', line 141 def var1_status if is_var1? status = 'var1' else status = 'other' end status end |
#vw_missing? ⇒ Boolean
210 211 212 |
# File 'lib/bio/sequence/aa/aa.rb', line 210 def vw_missing? true unless self =~ /VW/i end |
#vw_pos ⇒ Object
29 30 31 |
# File 'lib/bio/sequence/aa/aa.rb', line 29 def vw_pos rindex("VW") end |
#vw_ww_missing? ⇒ Boolean
214 215 216 |
# File 'lib/bio/sequence/aa/aa.rb', line 214 def vw_ww_missing? true if ww_missing? && vw_missing? end |
#ww_missing? ⇒ Boolean
206 207 208 |
# File 'lib/bio/sequence/aa/aa.rb', line 206 def ww_missing? true unless self =~ /WW/i end |
#ww_pos ⇒ Object
25 26 27 |
# File 'lib/bio/sequence/aa/aa.rb', line 25 def ww_pos rindex("WW") end |