common/tools/sortUnique.pl
author Brendan Donegan brendand@symbian.org
Mon, 21 Sep 2009 16:17:41 +0100
changeset 479 b6c4098af3f0
parent 246 4f2482f1dd48
child 1316 0b4a09013baf
permissions -rw-r--r--
added my machine
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
246
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     1
#!perl -w
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     2
use strict;
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     3
# Sorts the input, removes duplicates, and outputs it
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     4
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     5
# Read it
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     6
my @content = <>;
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     7
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     8
# Sort it, and grep to remove duplicates
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
     9
my $previous = "\n\n";
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
    10
@content = grep {$_ ne $previous && ($previous = $_, 1) } sort @content;
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
    11
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
    12
# Write it
4f2482f1dd48 Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff changeset
    13
print @content;