#!/usr/bin/perl
use strict;
use warnings;

# Filter that drops repeated requests for the same paper by the same user.
#
# Reads whitespace-separated records from the files named on the command
# line (or from STDIN when there are none).  A record is printed when its
# paper id differs from both of the two most recently printed paper ids of
# the current user; otherwise it is counted as a duplicate.  The duplicate
# count is written to STDERR at the end.
#
# Field 0 of a record is treated as the user.  Field 6 is presumably the
# requested path (the input looks like a web/ftp access log) -- TODO confirm
# against whatever produces the input.
#
# Printed records are re-joined with single spaces, so runs of whitespace in
# the input are not preserved.

# paper_key($line, $request)
#
# Build the "<name>/<number>" id used to recognise repeats.
#   $line    - the full input record
#   $request - field 6 of the record; may be undef on short records
# Returns the id as a string.  A part that cannot be extracted is left
# empty, so a record with nothing recognisable yields "/".
sub paper_key {
    my ($line, $request) = @_;
    $request = '' unless defined $request;

    # The first run of seven digits anywhere in the record is the number.
    my $number = $line =~ /(\d{7})/ ? $1 : '';

    # The name part sits in a different place depending on whether the
    # request field mentions "papers".  Both patterns are matched against
    # the whole record, not just the request field.
    my $name = '';
    if ($request =~ /papers/) {
        $name = $1 if $line =~ m{/ftp/([\w-]+)\.?.*/papers};
    }
    else {
        $name = $1 if $line =~ m{/.*/([\w-]+)\.?.*/\??\d{7}};
    }

    return "$name/$number";
}

# filter_repeats($in, $out)
#
# Copy records from the filehandle $in to the filehandle $out, skipping any
# record whose paper id equals one of the two ids most recently printed for
# the same user.  Returns the number of records skipped.
sub filter_repeats {
    my ($in, $out) = @_;

    my $last_user    = '';
    my $last_paper   = '';
    my $paper_before = '';
    my $dupe         = 0;

    while (my $line = <$in>) {
        my @field = split ' ', $line;
        my $user = defined $field[0] ? $field[0] : '';

        if ($user ne $last_user) {
            # between users: forget the previous user's history
            $last_paper   = '';
            $paper_before = '';
        }
        $last_user = $user;

        # get the unique paper id
        my $paper = paper_key($line, $field[6]);

        if ($paper ne $last_paper && $paper ne $paper_before) {
            print {$out} "@field\n";
            $paper_before = $last_paper;
            $last_paper   = $paper;
        }
        else {
            # History is deliberately left untouched for a skipped record.
            $dupe++;
        }
    }

    return $dupe;
}

# Run as a filter only when executed directly, so the subs above can be
# loaded from another file without consuming STDIN.
unless (caller) {
    my $dupe = filter_repeats(\*ARGV, \*STDOUT);
    print STDERR "$dupe\n";
}