'''
Read FASTA files.

read_in_fasta(file_path) parses the FASTA file at file_path and returns a
dictionary that maps each definition line (without the leading '>') to its
sequence.
'''


import sys


def read_in_fasta(file_path):
    '''Parse a FASTA file into a dictionary of sequences.

    Args:
        file_path: Path of the FASTA file to read.

    Returns:
        A dict mapping each definition line (leading '>' and surrounding
        whitespace removed) to its sequence as one string. Sequence lines
        belonging to the same record are concatenated, and records that
        share a definition line are merged into a single entry. A header
        without any sequence lines maps to the empty string.

    Raises:
        ValueError: If sequence data appears before the first header line.
        OSError: If the file cannot be opened.
    '''
    chunks = {}
    defline = None
    # The context manager closes the file even when parsing fails.
    with open(file_path) as fasta_file:
        for raw_line in fasta_file:
            line = raw_line.strip()
            if not line:
                # Blank lines carry no sequence data.
                continue
            if line.startswith('>'):
                # Drop only the leading marker so that a '>' inside the
                # description text is preserved.
                defline = line[1:].strip()
                chunks.setdefault(defline, [])
            elif defline is None:
                raise ValueError(
                    'sequence data found before the first FASTA header '
                    'in {!r}'.format(file_path)
                )
            else:
                chunks[defline].append(line)
    # Join once per record instead of growing a string line by line.
    return {name: ''.join(parts) for name, parts in chunks.items()}