Hi all,
I would like to get your assistance in retrieving lines containing L1. My Excel dataset contains around 8000 lines. I converted it into a tab-delimited text file and extracted the lines containing L1. My output is a list of lines containing L1, saved in an outfile. Some of the lines from my outfile are shown below:
"NM_001354","chr10","-",5021965,5050207,"Y","LINE,LTR,","L1,MaLR,","+,-,","5039541,5050000,","5039749,5050345,","5'UTR,5'UTR,"
"NM_001494","chr10","-",5847192,5895379,"N","LINE,","L1,","+,","5850340,","5850974,","5'UTR,"
"NM_012311","chr10","-",7837373,7869950,"N","LINE,","L1,","+,","7837122,","7837639,","3'UTR,"
"NM_001033855","chr10","-",14988878,15036100,"N","SINE,LINE,SINE,SINE,LINE,","Alu,L1,Alu,Alu,L1,","-,-,-,-,-,","14988880,14989317,14989863,14990031,14990305,","14989154,14989863,14990030,14990305,14990395,","3'UTR,3'UTR,3'UTR,3'UTR,3'UTR,"
"NM_001033855","chr10","-",14988878,15036100,"N","SINE,LINE,SINE,SINE,LINE,","Alu,L1,Alu,Alu,L1,","-,-,-,-,-,","14988880,14989317,14989863,14990031,14990305,","14989154,14989863,14990030,14990305,14990395,","3'UTR,3'UTR,3'UTR,3'UTR,3'UTR,"
"NM_001033857","chr10","-",14988878,15036100,"N","SINE,LINE,SINE,SINE,LINE,SINE,","Alu,L1,Alu,Alu,L1,MIR,","-,-,-,-,-,+,","14988880,14989317,14989863,14990031,14990305,15029509,","14989154,14989863,14990030,14990305,14990395,15029704,","3'UTR,3'UTR,3'UTR,3'UTR,3'UTR,5'UTR,"
"NM_001354","chr10","-",5021965,5050207,"Y","LINE,LTR,","L1,MaLR,","+,-,","5039541,5050000,","5039749,5050345,","5'UTR,5'UTR,"
"NM_001494","chr10","-",5847192,5895379,"N","LINE,","L1,","+,","5850340,","5850974,","5'UTR,"
"NM_012311","chr10","-",7837373,7869950,"N","LINE,","L1,","+,","7837122,","7837639,","3'UTR,"
"NM_001033855","chr10","-",14988878,15036100,"N","SINE,LINE,SINE,SINE,LINE,","Alu,L1,Alu,Alu,L1,","-,-,-,-,-,","14988880,14989317,14989863,14990031,14990305,","14989154,14989863,14990030,14990305,14990395,","3'UTR,3'UTR,3'UTR,3'UTR,3'UTR,"
"NM_001033855","chr10","-",14988878,15036100,"N","SINE,LINE,SINE,SINE,LINE,","Alu,L1,Alu,Alu,L1,","-,-,-,-,-,","14988880,14989317,14989863,14990031,14990305,","14989154,14989863,14990030,14990305,14990395,","3'UTR,3'UTR,3'UTR,3'UTR,3'UTR,"
"NM_001033857","chr10","-",14988878,15036100,"N","SINE,LINE,SINE,SINE,LINE,SINE,","Alu,L1,Alu,Alu,L1,MIR,","-,-,-,-,-,+,","14988880,14989317,14989863,14990031,14990305,15029509,","14989154,14989863,14990030,14990305,14990395,15029704,","3'UTR,3'UTR,3'UTR,3'UTR,3'UTR,5'UTR,"
You may notice that some lines contain only "L1," while others contain "L1,MaLR," and so on. I would like to retrieve the lines containing only "L1," into one outfile and the other lines into another outfile. I need a regular expression for matching this.
Thank you,
Regards,
Sayee.
---------- Post updated at 10:13 PM ---------- Previous update was at 10:09 PM ----------
Sorry friends,
I need to parse the data using Perl!