# DTU_ORBIT_rip - version 07.06.2017 at 08:17
# Extracts records from the HTML source code of DTU's ORBIT database.
#
# Usage: perl <this script> <input file> <output file>
#
# First pass (this section): copy the input file into the scratch file
# temp2.txt, replacing every line break and TAB with a space so the text
# is written out without line breaks.
use strict;
use warnings;

die "Usage: $0 <input file> <output file>\n" unless @ARGV >= 2;

# Three-argument open keeps characters in the file names from being
# interpreted as an open mode. The bareword handle names are kept as they
# are because later parts of the script may refer to them.
my $file = $ARGV[0];
open(INPUT, '<', $file) or die("Input file $file not found.\n");

my $output = $ARGV[1];
open(OUTPUT, '>', $output) or die "Can't create $output.\n";

# Scratch file: created (or truncated) in read/write mode.
open(TEMP, '+>', 'temp2.txt') or die $!;

# NOTE(review): the readline operand was absent in the reviewed text;
# INPUT is the only handle opened for reading at this point -- confirm.
while (my $line = <INPUT>) {
    # Replace line breaks and TABs with spaces throughout the input.
    $line =~ tr/\n\t/ /;

    # NOTE(review): the next two substitutions appear to have lost part of
    # their patterns (possibly HTML tags). As written they leave $line
    # unchanged -- confirm against the original script.
    $line =~ s|(.*?)|$1|ig;
    $line =~ s|\n||ig;

    print TEMP $line;
}

print "Empty lines and TABs removed\n\n";

# Buffered write errors only surface at close, so check it.
close(TEMP) or die "Can't close temp2.txt: $!\n";

# NOTE(review): the following statement is cut off in the reviewed excerpt
# and is left exactly as found.
open(TEMP2, "