author | Simon Howkins <simonh@symbian.org> |
Thu, 20 Aug 2009 12:49:47 +0100 | |
changeset 371 | fcb6057a8009 |
parent 231 | 4f2482f1dd48 |
permissions | -rw-r--r-- |
231
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
1 |
#!perl -w |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
2 |
use strict; |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
3 |
# Sorts the input, removes duplicates, and outputs it |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
4 |
|
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
5 |
# Read it |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
6 |
my @content = <>; |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
7 |
|
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
8 |
# Sort it, and grep to remove duplicates |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
9 |
my $previous = "\n\n"; |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
10 |
@content = grep {$_ ne $previous && ($previous = $_, 1) } sort @content; |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
11 |
|
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
12 |
# Write it |
4f2482f1dd48
Added sorting and removal of duplicates from TSV files.
Simon Howkins <simonh@symbian.org>
parents:
diff
changeset
|
13 |
print @content; |