代码说明:

输入是一个 FASTA 格式的 txt 文件,其中包含多条蛋白质序列。计算 ss、PSSM 或 disorder score 时都只能逐条序列计算,因此需要先把每条序列拆分到单独的 txt 文件中。

分割前:

【BioCode】将多个蛋白质序列分成单个的txt文档-LMLPHP

分割后:

【BioCode】将多个蛋白质序列分成单个的txt文档-LMLPHP

Here is the code:

package single;

import java.io.BufferedReader;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.*;
import java.io.IOException;
/**
 * Splits one text file containing many sequence records into individual TXT files.
 *
 * <p>The input is consumed as consecutive two-line records: the first line of each
 * record is echoed to standard output and written to the output file followed by
 * {@code "\n"}; the second line is written after it without a trailing newline.
 * Output files are named {@code 1.txt}, {@code 2.txt}, ... in record order.
 *
 * <p>NOTE(review): records are assumed to span exactly two lines (presumably a FASTA
 * header line plus a single-line sequence); sequences wrapped over several lines are
 * not merged — confirm against the real input files.
 */
public class Single {

    /** Output directory used by {@link #getTxt(String)} when none is supplied. */
    private static final String DEFAULT_OUTPUT_DIR =
            "E:\\experiment--help\\linglingbao\\new-single\\";

    /** Input file used by {@link #main(String[])} when no argument is supplied. */
    private static final String DEFAULT_INPUT_PATH =
            "E:\\experiment--help\\linglingbao\\new-single\\seq.txt";

    /**
     * Splits the file at {@code path} into numbered TXT files in the default output directory.
     *
     * @param path path of the multi-record input file
     * @throws IOException if the input cannot be read or an output file cannot be written
     *         (this includes {@link FileNotFoundException} for a missing input file or
     *         a missing output directory)
     */
    public static void getTxt(String path) throws IOException {
        getTxt(path, DEFAULT_OUTPUT_DIR);
    }

    /**
     * Splits the file at {@code path} into numbered TXT files inside {@code outputDir}.
     *
     * <p>Each line read as a record's first line is printed to standard output, and the
     * total number of records is printed once the whole input has been processed.
     *
     * @param path path of the multi-record input file
     * @param outputDir directory that receives {@code 1.txt}, {@code 2.txt}, ...; it must
     *        already exist, and an empty string means the current working directory
     * @throws IOException if the input cannot be read or an output file cannot be written
     * @throws NullPointerException if {@code outputDir} is {@code null}
     */
    public static void getTxt(String path, String outputDir) throws IOException {
        String prefix = withTrailingSeparator(outputDir);
        int count = 0;
        // try-with-resources closes the reader even when reading or writing fails.
        try (BufferedReader br = new BufferedReader(new FileReader(path))) {
            String header;
            while ((header = br.readLine()) != null) {
                System.out.println(header);
                // null when the input ends right after a header line (odd line count).
                String sequence = br.readLine();
                count++;
                // One writer per record, closed immediately so file handles do not pile up.
                try (BufferedWriter out =
                        new BufferedWriter(new FileWriter(prefix + count + ".txt"))) {
                    out.write(header + "\n");
                    if (sequence != null) {
                        // Writer.write(String) throws NullPointerException on null,
                        // so a dangling header is written on its own.
                        out.write(sequence);
                    }
                }
            }
        }
        System.out.println(count);
    }

    /** Returns {@code dir} ending in a path separator so a file name can be appended directly. */
    private static String withTrailingSeparator(String dir) {
        if (dir == null) {
            throw new NullPointerException("outputDir");
        }
        if (dir.isEmpty() || dir.endsWith("/") || dir.endsWith("\\")) {
            return dir;
        }
        return dir + File.separator;
    }

    /**
     * Command-line entry point.
     *
     * @param args optional: {@code args[0]} is the input file and {@code args[1]} the output
     *        directory; the built-in default locations are used for any argument not given
     */
    public static void main(String[] args) {
        String path = args.length > 0 ? args[0] : DEFAULT_INPUT_PATH;
        String outputDir = args.length > 1 ? args[1] : DEFAULT_OUTPUT_DIR;
        try {
            getTxt(path, outputDir);
        } catch (IOException e) {
            e.printStackTrace();
        }
    }
}
05-14 11:56