From 2e45ec63199377039f1552ed85a2d80fc80d958f Mon Sep 17 00:00:00 2001 From: Mike Ryan Date: Fri, 18 Mar 2016 20:48:48 -0700 Subject: [PATCH] tools: make parse_companies.pl more forgiving of weird HTML Several company identifier lines do not end in a </td> but rather <br>
followed by newline followed by </td>. This dirty hack is more forgiving of HTML weirdnesses in the SIG's company identifiers page. --- tools/parse_companies.pl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tools/parse_companies.pl b/tools/parse_companies.pl index 6dc358ee0..1746222da 100755 --- a/tools/parse_companies.pl +++ b/tools/parse_companies.pl @@ -45,7 +45,7 @@ while (<>) { $next_is_name = 1; # next should be company name - } elsif ($next_is_name && m|\<td.*\>(.*)\</td\>|) { + } elsif ($next_is_name && m|\<td.*\>(.*)\<|) { my $name = uri_decode($1); $name =~ s/^\s+//g; # kill leading $name =~ s/\s+$//g; # and trailing space -- 2.47.3