From 98358e8df3134a67aeb495edeb62310168083252 Mon Sep 17 00:00:00 2001 From: Andrew Yates <ayates@ebi.ac.uk> Date: Wed, 12 Sep 2012 15:02:28 +0000 Subject: [PATCH] Fix parsing of files from Ken @ CSHL. ORIGIN also appeared in a context other than marking the start of the sequence in a GenBank A. thaliana file, so the match is now anchored to the start of a line --- misc-scripts/xref_mapping/XrefParser/RefSeqGPFFParser.pm | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/misc-scripts/xref_mapping/XrefParser/RefSeqGPFFParser.pm b/misc-scripts/xref_mapping/XrefParser/RefSeqGPFFParser.pm index 7e1d7aa610..b7c2c9336a 100644 --- a/misc-scripts/xref_mapping/XrefParser/RefSeqGPFFParser.pm +++ b/misc-scripts/xref_mapping/XrefParser/RefSeqGPFFParser.pm @@ -223,7 +223,7 @@ sub create_xrefs { $description =~ s/\s+/ /g; $description = substr($description, 0, 255) if (length($description) > 255); - my ($seq) = $_ =~ /ORIGIN\s+(.+)/s; # /s allows . to match newline + my ($seq) = $_ =~ /^\s*ORIGIN\s+(.+)/ms; # /s allows . to match newline my @seq_lines = split /\n/, $seq; my $parsed_seq = ""; foreach my $x (@seq_lines) { -- GitLab