- 论坛徽章:
- 145
|
回复 1# 小小脑
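Which one do you like? The first command keeps a line of a.txt when the first "/"-separated name in column 3 appears in column 1 of b.txt; the second keeps a line only when every "/"-separated name in column 3 appears there.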
$ awk 'FNR==NR{b[$1];next}{d=$3;gsub("/.*","",d);if(d in b)print}' b.txt a.txt
super1_35231_42804 7574 gag_pre-integrs/RVT_2/Retrotran_gag_2/rve
super1_48918_54312 5395 Retrotran_gag_2/gag_pre-integrs/rve/RVT_2
super1_71681_76173 4493 Retrotran_gag_2
super1_192233_199678 7446 Retrotrans_gag/Asp_protease_2/gag-asp_proteas/RVP_2/RVT_1/rve/Chromo
super1_216492_223313 6822 Retrotrans_gag
super1_230561_235028 4468 Retrotran_gag_2/zf-CCHC/zf-CCHC_4
super1_291428_302513 11086 Retrotrans_gag/RVP_2/RVT_1/rve
super1_310462_317345 6884 RVT_1/rve
super1_371861_386288 14428 RVT_3
super1_399520_406675 7156 RVP_2/RVT_1/Chromo
super1_436013_445837 9825 Retrotran_gag_2/rve
super1_470886_473993 3108 Retrotran_gag_2/zf-CCHC
super1_507714_519214 11501 Retrotrans_gag/DUF659
super1_525959_531995 6037 Retrotran_gag_2/gag_pre-integrs/rve/RVT_2
super1_533502_547347 13846 zf-CCHC
super1_572981_579149 6169 Retrotrans_gag/gag-asp_proteas/Asp_protease_2/RVP_2/rve/Chromo
super1_596192_602055 5864 RVT_2
super1_617483_626724 9242 Asp_protease_2/gag-asp_proteas/RVP_2/RVT_1/rve/Chromo
super1_646356_649745 3390 Retrotran_gag_2/zf-CCHC
super1_657074_663210 6137 Retrotran_gag_2/gag_pre-integrs/rve/RVT_2
super1_663995_670109 6115 RVT_1/Chromo
super1_671390_674778 3389 Retrotran_gag_2/zf-CCHC
super1_725051_729096 4046 Asp_protease_2/gag-asp_proteas/RVP_2/RVT_1
super1_736512_740032 3521 Retrotran_gag_2/zf-CCHC
super1_781549_796535 14987 Retrotran_gag_2
super1_803016_813795 10780 Retrotran_gag_2/RVT_2/RVT_1/Chromo
super1_818390_823335 4946 gag_pre-integrs/rve/RVT_2
super1_824710_830397 5688 Retrotran_gag_2/gag_pre-integrs/rve/RVT_2
super1_894475_898077 3603 Retrotran_gag_2/zf-CCHC
super1_923458_926812 3355 Retrotran_gag_2/zf-CCHC_2/zf-CCHC
super1_929277_936403 7127 Retrotran_gag_2/zf-CCHC/rve/RVT_2
super1_957656_963701 6046 DUF4219/zf-CCHC/gag_pre-integrs/rve/RVT_2
super1_967461_973479 6019 Retrotran_gag_2/zf-CCHC/gag_pre-integrs/rve/RVT_2
$ awk 'FNR==NR{b[$1];next}{t=split($3,d,"/");for(n=1;n<=t;n+=1)if(!(d[n] in b))next}1' b.txt a.txt
super1_35231_42804 7574 gag_pre-integrs/RVT_2/Retrotran_gag_2/rve
super1_48918_54312 5395 Retrotran_gag_2/gag_pre-integrs/rve/RVT_2
super1_71681_76173 4493 Retrotran_gag_2
super1_192233_199678 7446 Retrotrans_gag/Asp_protease_2/gag-asp_proteas/RVP_2/RVT_1/rve/Chromo
super1_216492_223313 6822 Retrotrans_gag
super1_230561_235028 4468 Retrotran_gag_2/zf-CCHC/zf-CCHC_4
super1_291428_302513 11086 Retrotrans_gag/RVP_2/RVT_1/rve
super1_310462_317345 6884 RVT_1/rve
super1_371861_386288 14428 RVT_3
super1_399520_406675 7156 RVP_2/RVT_1/Chromo
super1_436013_445837 9825 Retrotran_gag_2/rve
super1_470886_473993 3108 Retrotran_gag_2/zf-CCHC
super1_525959_531995 6037 Retrotran_gag_2/gag_pre-integrs/rve/RVT_2
super1_533502_547347 13846 zf-CCHC
super1_572981_579149 6169 Retrotrans_gag/gag-asp_proteas/Asp_protease_2/RVP_2/rve/Chromo
super1_596192_602055 5864 RVT_2
super1_617483_626724 9242 Asp_protease_2/gag-asp_proteas/RVP_2/RVT_1/rve/Chromo
super1_646356_649745 3390 Retrotran_gag_2/zf-CCHC
super1_657074_663210 6137 Retrotran_gag_2/gag_pre-integrs/rve/RVT_2
super1_663995_670109 6115 RVT_1/Chromo
super1_671390_674778 3389 Retrotran_gag_2/zf-CCHC
super1_725051_729096 4046 Asp_protease_2/gag-asp_proteas/RVP_2/RVT_1
super1_736512_740032 3521 Retrotran_gag_2/zf-CCHC
super1_781549_796535 14987 Retrotran_gag_2
super1_803016_813795 10780 Retrotran_gag_2/RVT_2/RVT_1/Chromo
super1_818390_823335 4946 gag_pre-integrs/rve/RVT_2
super1_824710_830397 5688 Retrotran_gag_2/gag_pre-integrs/rve/RVT_2
super1_894475_898077 3603 Retrotran_gag_2/zf-CCHC
super1_923458_926812 3355 Retrotran_gag_2/zf-CCHC_2/zf-CCHC
super1_929277_936403 7127 Retrotran_gag_2/zf-CCHC/rve/RVT_2
super1_957656_963701 6046 DUF4219/zf-CCHC/gag_pre-integrs/rve/RVT_2
super1_967461_973479 6019 Retrotran_gag_2/zf-CCHC/gag_pre-integrs/rve/RVT_2
|
|