2007-10-23 23:14:03 +02:00
|
|
|
#! /usr/bin/env perl
|
2006-12-17 17:36:17 +01:00
|
|
|
#
|
2007-06-06 10:37:35 +02:00
|
|
|
#
|
2006-12-17 17:36:17 +01:00
|
|
|
#
|
2007-11-28 15:28:46 +01:00
|
|
|
# Funambol is a mobile platform developed by Funambol, Inc.
|
|
|
|
# Copyright (C) 2003 - 2007 Funambol, Inc.
|
|
|
|
#
|
|
|
|
# This program is free software; you can redistribute it and/or modify it under
|
|
|
|
# the terms of the GNU Affero General Public License version 3 as published by
|
|
|
|
# the Free Software Foundation with the addition of the following permission
|
|
|
|
# added to Section 15 as permitted in Section 7(a): FOR ANY PART OF THE COVERED
|
|
|
|
# WORK IN WHICH THE COPYRIGHT IS OWNED BY FUNAMBOL, FUNAMBOL DISCLAIMS THE
|
|
|
|
# WARRANTY OF NON INFRINGEMENT OF THIRD PARTY RIGHTS.
|
|
|
|
#
|
|
|
|
# This program is distributed in the hope that it will be useful, but WITHOUT
|
|
|
|
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
|
|
# FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
|
|
|
|
# details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU Affero General Public License
|
|
|
|
# along with this program; if not, see http://www.gnu.org/licenses or write to
|
|
|
|
# the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
|
|
|
|
# MA 02110-1301 USA.
|
|
|
|
#
|
|
|
|
# You can contact Funambol, Inc. headquarters at 643 Bair Island Road, Suite
|
|
|
|
# 305, Redwood City, CA 94063, USA, or at email address info@funambol.com.
|
|
|
|
#
|
|
|
|
# The interactive user interfaces in modified source and object code versions
|
|
|
|
# of this program must display Appropriate Legal Notices, as required under
|
|
|
|
# Section 5 of the GNU Affero General Public License version 3.
|
|
|
|
#
|
|
|
|
# In accordance with Section 7(b) of the GNU Affero General Public License
|
|
|
|
# version 3, these Appropriate Legal Notices must retain the display of the
|
|
|
|
# "Powered by Funambol" logo. If the display of the logo is not reasonably
|
|
|
|
# feasible for technical reasons, the Appropriate Legal Notices must display
|
|
|
|
# the words "Powered by Funambol".
|
2006-12-17 17:36:17 +01:00
|
|
|
#
|
|
|
|
#
|
|
|
|
#
|
2007-11-08 21:56:37 +01:00
|
|
|
# Usage: <file>
|
|
|
|
# <left file> <right file>
|
|
|
|
# Either normalizes a file or compares two of them in a side-by-side
|
|
|
|
# diff.
|
|
|
|
#
|
|
|
|
# Checks environment variables:
|
|
|
|
#
|
|
|
|
# CLIENT_TEST_SERVER=funambol|scheduleworld|egroupware|synthesis
|
|
|
|
# Enables code which simplifies the text files just like
|
|
|
|
# certain well-known servers do. This is useful for testing
|
|
|
|
# to ignore the data loss introduced by these servers or (for
|
|
|
|
# users) to simulate the effect of these servers on their data.
|
|
|
|
#
|
|
|
|
# CLIENT_TEST_CLIENT=evolution|addressbook (Mac OS X/iPhone)
|
|
|
|
# Same as for servers this replicates the effect of storing
|
|
|
|
# data in the clients.
|
|
|
|
#
|
|
|
|
# CLIENT_TEST_LEFT_NAME="before sync"
|
|
|
|
# CLIENT_TEST_RIGHT_NAME="after sync"
|
|
|
|
# CLIENT_TEST_REMOVED="removed during sync"
|
|
|
|
# CLIENT_TEST_ADDED="added during sync"
|
|
|
|
# Setting these variables changes the default legend
|
|
|
|
# printed above the left and right file during a
|
|
|
|
# comparison.
|
|
|
|
#
|
|
|
|
# CLIENT_TEST_COMPARISON_FAILED=1
|
|
|
|
# Overrides the default error code when changes are found.
|
|
|
|
|
2006-12-17 17:36:17 +01:00
|
|
|
|
|
|
|
use strict;
|
|
|
|
use encoding 'utf8';
|
2007-03-29 22:39:54 +02:00
|
|
|
use Algorithm::Diff;
|
2006-12-17 17:36:17 +01:00
|
|
|
|
2007-10-23 23:14:03 +02:00
|
|
|
# Which server and which local backend should be simulated?  Both names
# come from the environment and fall back to "funambol" / "evolution".
my ($server, $client) = (
    $ENV{CLIENT_TEST_SERVER} || "funambol",
    $ENV{CLIENT_TEST_CLIENT} || "evolution",
);

# One boolean per known server: true when its name occurs anywhere in
# $server (several names may be combined in one value).
my ($scheduleworld, $synthesis, $egroupware, $funambol) =
    map { scalar($server =~ /$_/) } qw(scheduleworld synthesis egroupware funambol);

# Same scheme for the local client backends.
my ($evolution, $addressbook) =
    map { scalar($client =~ /$_/) } qw(evolution addressbook);
|
2006-12-17 17:36:17 +01:00
|
|
|
|
|
|
|
# Prints a short description of the two invocation modes to stdout.
# Takes no parameters.
sub Usage {
    my $help =
        "$0 <vcards.vcf\n"
      . " normalizes one file (stdin or single argument), prints to stdout\n"
      . "$0 vcards1.vcf vcards2.vcf\n"
      . " compares the two files\n"
      . "Also works for iCalendar files.\n";
    print $help;
}
|
|
|
|
|
2007-11-30 23:44:51 +01:00
|
|
|
# Returns a copy of the given string with the ASCII letters a-z mapped to
# A-Z.  All other characters are left alone and the argument itself is
# not modified.
sub uppercase {
    (my $upper = $_[0]) =~ tr/a-z/A-Z/;
    return $upper;
}
|
|
|
|
|
2007-03-29 22:39:54 +02:00
|
|
|
# Returns the number of leading white space characters of a string.
# Used by Normalize() to order the lines inside a BEGIN/END block.
sub numspaces {
    my $str = shift;
    $str =~ /^(\s*)/;
    return length($1);
}

# Normalizes a stream of vCards and/or iCalendar objects so that two
# semantically equivalent files produce the same list of lines.
#
# parameters: file handle with input, width to use for reformatted lines
# returns list of lines without line breaks; items are sorted and
# separated from each other by one empty line
#
# Which simplifications are applied in addition to the generic ones
# depends on the file-level flags $scheduleworld, $synthesis, $egroupware,
# $funambol and $addressbook.
sub Normalize {
    my $in = shift;
    my $width = shift;

    # $_ is used as the working buffer below; localize it so that the
    # caller's $_ is not clobbered
    local $_ = join( "", <$in> );
    s/\r//g;

    my @items = ();

    foreach $_ ( split( /(?:(?<=\nEND:VCARD)|(?<=\nEND:VCALENDAR))\n*/ ) ) {
        # undo line continuation
        s/\n\s//gs;
        # ignore charset specifications, assume UTF-8
        s/;CHARSET="?UTF-8"?//g;

        # UID may differ, but only in vCards and journal entries:
        # in calendar events the UID needs to be preserved to handle
        # meeting invitations/replies correctly
        s/((VCARD|VJOURNAL).*)^UID:[^\n]*\n/$1/msg;

        # expand <foo> shortcuts to TYPE=<foo>; the parameters in front
        # of the shortcut ($2) must be kept, otherwise all but the last
        # shortcut of a property would silently be dropped
        while (s/^(ADR|EMAIL|TEL)([^:\n]*);(HOME|OTHER|WORK|PARCEL|INTERNET|CAR|VOICE|CELL|PAGER)/$1$2;TYPE=$3/mg) {}

        # the distinction between an empty and a missing property
        # is vague and handled differently, so ignore empty properties
        s/^[^:\n]*:;*\n//mg;

        # use separate TYPE= fields
        while( s/^(\w*[^:\n]*);TYPE=(\w*),(\w*)/$1;TYPE=$2;TYPE=$3/mg ) {}

        # make TYPE uppercase (in vCard 3.0 at least those parameters are case-insensitive)
        while( s/^(\w*[^:\n]*);TYPE=(\w*?[a-z]\w*?)([;:])/ $1 . ";TYPE=" . uppercase($2) . $3 /mge ) {}

        # replace parameters with a sorted parameter list
        s!^([^;:\n]*);(.*?):!$1 . ";" . join(';',sort(split(/;/, $2))) . ":"!meg;

        # Map non-standard ADR;TYPE=OTHER to PARCEL, just like SyncEvolution does
        s/^ADR;TYPE=OTHER/ADR;TYPE=PARCEL/mg;
        # Ignore remaining "other" email, address and telephone type - this is
        # an Evolution specific extension which might not be preserved.
        s/^(ADR|EMAIL|TEL)([^:\n]*);TYPE=OTHER/$1$2/mg;
        # TYPE=PREF on the other hand is not used by Evolution, but
        # might be sent back.
        s/^(ADR|EMAIL)([^:\n]*);TYPE=PREF/$1$2/mg;
        # Evolution does not need TYPE=INTERNET for email
        s/^(EMAIL)([^:\n]*);TYPE=INTERNET/$1$2/mg;
        # ignore TYPE=PREF in address, does not matter in Evolution
        s/^((ADR|LABEL)[^:\n]*);TYPE=PREF/$1/mg;
        # ignore extra separators in multi-value fields
        s/^((ORG|N|(ADR[^:\n]*?)):.*?);*$/$1/mg;
        # the type of certain fields is ignored by Evolution
        s/^X-(AIM|GROUPWISE|ICQ|YAHOO);TYPE=HOME/X-$1/gm;
        # Evolution ignores an additional pager type
        s/^TEL;TYPE=PAGER;TYPE=WORK/TEL;TYPE=PAGER/gm;
        # LABEL property is sent by Evolution, but otherwise ignored
        s/^LABEL[;:].*\n//mg;
        # TYPE=VOICE is the default in Evolution and may or may not appear in the vcard;
        # this simplification is a bit too aggressive and hides the problematic
        # TYPE=PREF,VOICE combination which Evolution does not handle :-/
        s/^TEL([^:\n]*);TYPE=VOICE,([^:\n]*):/TEL$1;TYPE=$2:/mg;
        s/^TEL([^:\n]*);TYPE=([^;:\n]*),VOICE([^:\n]*):/TEL$1;TYPE=$2$3:/mg;
        s/^TEL([^:\n]*);TYPE=VOICE([^:\n]*):/TEL$1$2:/mg;
        # don't care about the TYPE property of PHOTOs
        s/^PHOTO;(.*)TYPE=[A-Z]*/PHOTO;$1/mg;
        # encoding is not case sensitive, skip white space in the middle of binary data
        if (s/^PHOTO;.*?ENCODING=(b|B|BASE64).*?:\s*/PHOTO;ENCODING=B: /mgi) {
            while (s/^PHOTO(.*?): (\S+)[\t ]+(\S+)/PHOTO$1: $2$3/mg) {}
        }
        # ignore extra day factor in front of weekday
        s/^RRULE:(.*)BYDAY=\+?1(\D)/RRULE:$1BYDAY=$2/mg;
        # remove default VALUE=DATE-TIME
        s/^(DTSTART|DTEND)([^:\n]*);VALUE=DATE-TIME/$1$2/mg;

        # remove fields which may differ
        s/^(PRODID|CREATED|DTSTAMP|LAST-MODIFIED|REV):.*\r?\n?//gm;
        # remove optional fields
        s/^(METHOD|X-WSS-[A-Z]*):.*\r?\n?//gm;

        # trailing line break(s) in a DESCRIPTION may or may not be
        # removed or added by servers
        s/^DESCRIPTION:(.*?)(\\n)+$/DESCRIPTION:$1/gm;

        if ($scheduleworld || $egroupware || $synthesis || $addressbook || $funambol) {
            # does not preserve X-EVOLUTION-UI-SLOT=
            s/^(\w+)([^:\n]*);X-EVOLUTION-UI-SLOT=\d+/$1$2/mg;
        }

        if ($scheduleworld) {
            # cannot distinguish EMAIL types
            s/^EMAIL;TYPE=\w*/EMAIL/mg;
            # replaces certain TZIDs with more up-to-date ones
            s;TZID(=|:)/(scheduleworld.com|softwarestudio.org)/Olson_\d+_\d+/;TZID$1/foo.com/Olson_20000101_1/;mg;
        }

        if ($synthesis) {
            # only preserves ORG "Company", but loses "Department" and "Office"
            s/^ORG:([^;:\n]+)(;[^\n]*)/ORG:$1/mg;
        }

        if ($funambol) {
            # only preserves ORG "Company";"Department", but loses "Office"
            s/^ORG:([^;:\n]+)(;[^;:\n]*)(;[^\n]*)/ORG:$1$2/mg;
        }

        if ($funambol) {
            # drops the second address line
            s/^ADR(.*?):([^;]*?);[^;]*?;/ADR$1:$2;;/mg;
        }

        if ($addressbook) {
            # some properties cannot be stored
            s/^(X-MOZILLA-HTML|X-EVOLUTION-FILE-AS|X-EVOLUTION-ANNIVERSARY|X-EVOLUTION-BLOG-URL|X-EVOLUTION-VIDEO-URL|X-GROUPWISE|ROLE|CATEGORIES|FBURL|CALURI|FN)(;[^:;\n]*)*:.*\r?\n?//gm;
            # only some parts of ADR are preserved: the first two
            # components are emptied and the parameters are dropped;
            # the value is split at semicolons which are not escaped
            # with a backslash
            s/^ADR(.*?)\:(.*)/my @fields = split(\/(?<!\\);\/, $2); "ADR:;;" . ($fields[2] || "") . ";" . ($fields[3] || "") . ";" . ($fields[4] || "") . ";" . ($fields[5] || "") . ";" . ($fields[6] || "")/gme;
            # TYPE=CAR not supported
            s/;TYPE=CAR//g;
        }

        if ($synthesis) {
            # does not preserve certain properties
            s/^(FN|BDAY|X-MOZILLA-HTML|X-EVOLUTION-FILE-AS|X-AIM|NICKNAME|PHOTO|CALURI|SEQUENCE|TRANSP|ORGANIZER)(;[^:;\n]*)*:.*\r?\n?//gm;
            # default ADR is HOME
            s/^ADR;TYPE=HOME/ADR/gm;
            # only some parts of N are preserved: the first, second
            # and fourth component
            s/^N((?:;[^;:]*)*)\:(.*)/my @fields = split(\/(?<!\\);\/, $2); "N$1:$fields[0];" . ($fields[1] || "") . ";;" . ($fields[3] || "")/gme;
            # this vcard contains too many ADR and PHONE entries - ignore it
            if (/This is a test case which uses almost all Evolution fields/) {
                next;
            }
            # breaks lines at semicolons, which adds white space
            while( s/^ADR:(.*); +/ADR:$1;/gm ) {}
            # no attributes stored for ATTENDEEs
            s/^ATTENDEE;.*?:/ATTENDEE:/msg;
        }

        if ($synthesis) {
            # VALARM not supported
            s/^BEGIN:VALARM.*?END:VALARM\r?\n?//msg;
        }

        if ($egroupware) {
            # CLASS:PUBLIC is added if none exists (as in our test cases),
            # several properties not preserved
            s/^(BDAY|CATEGORIES|FBURL|PHOTO|FN|X-[A-Z-]*|CALURI|CLASS|NICKNAME|UID|TRANSP|PRIORITY|SEQUENCE)(;[^:;\n]*)*:.*\r?\n?//gm;
            # org gets truncated
            s/^ORG:([^;:\n]*);.*/ORG:$1/gm;
        }

        if ($funambol) {
            # several properties are not preserved
            s/^(CALURI|FBURL|FN|PHOTO|X-EVOLUTION-ANNIVERSARY|X-MOZILLA-HTML|X-EVOLUTION-FILE-AS|X-AIM|X-EVOLUTION-ASSISTANT|X-EVOLUTION-BLOG-URL|X-EVOLUTION-MANAGER|X-EVOLUTION-SPOUSE|X-EVOLUTION-VIDEO-URL|X-GROUPWISE|X-ICQ|X-YAHOO)(;[^:;\n]*)*:.*\r?\n?//gm;

            # quoted-printable line breaks are =0D=0A, not just single =0A
            s/(?<!=0D)=0A/=0D=0A/g;
            # only three email addresses, fourth one from test case gets lost
            # (carriage returns were already removed above, so only \n
            # can terminate the line; dots are matched literally)
            s/^EMAIL:john\.doe\@yet\.another\.world\n//mg;
            # this particular type is not preserved
            s/ADR;TYPE=PARCEL:Test Box #3/ADR;TYPE=HOME:Test Box #3/;
        }

        if ($funambol || $egroupware) {
            # NOTE may be truncated due to length restrictions
            s/^(NOTE(;[^:;\n]*)*:.{0,160}).*(\r?\n?)/$1$3/gm;
        }

        # treat X-MOZILLA-HTML=FALSE as if the property didn't exist
        s/^X-MOZILLA-HTML:FALSE\r?\n?//gm;

        my @formatted = ();

        # Modify lines to cover not more than
        # $width characters by folding lines (as done for the N or SUMMARY above),
        # but also indent each inner BEGIN/END block
        # and finally sort the lines.
        # We need to keep a stack of open blocks in @formatted:
        # - BEGIN creates another open block
        # - END closes it, sorts it, and adds as single string to the parent block
        push @formatted, [];
        foreach $_ (split /\n/, $_) {
            if (/^BEGIN:/) {
                # start a new block
                push @formatted, [];
            }

            # indentation grows with the nesting depth; the outermost
            # BEGIN/END block is not indented at all
            my $spaces = " " x ($#formatted - 1);
            # reserve one column for the continuation marker
            my $thiswidth = $width -1 - length($spaces);
            $thiswidth = 1 if $thiswidth <= 0;
            s/(.{$thiswidth})(?!$)/$1\n /g;
            s/^(.*)$/$spaces$1/mg;
            push @{$formatted[$#formatted]}, $_;

            if (/^\s*END:/) {
                my $block = pop @formatted;
                my $begin = shift @{$block};
                my $end = pop @{$block};

                # Keep begin/end as first/last line,
                # inbetween sort, but so that N or SUMMARY are
                # at the top. This ensures that the order of items
                # is the same, even if individual properties differ.
                # Also put indented blocks at the end, not the top.
                #
                # The N/SUMMARY rule only decides when exactly one of
                # the two lines matches; otherwise the comparison would
                # claim "a before b" and "b before a" at the same time.
                my @sorted = sort {
                    my $a_first = $a =~ /^\s*(?:N|SUMMARY):/;
                    my $b_first = $b =~ /^\s*(?:N|SUMMARY):/;
                    ($a_first && !$b_first) ? -1 :
                    ($b_first && !$a_first) ? 1 :
                    ($a =~ /^\s/ && $b =~ /^\S/) ? 1 :
                    numspaces($a) == numspaces($b) ? $a cmp $b :
                    numspaces($a) - numspaces($b)
                } @{$block};

                $_ = join("\n", $begin, @sorted, $end);
                push @{$formatted[$#formatted]}, $_;
            }
        }

        # the completed outermost block ends up as first entry of the
        # bottom stack element
        push @items, ${$formatted[0]}[0];
    }

    return split( /\n/, join( "\n\n", sort @items ));
}
|
|
|
|
|
|
|
|
# number of columns available for output:
# try tput without printing the shell's error if not found,
# default to 80
#
# "tput" has to be called with the capability name ("cols"); calling it
# without one is a usage error, which would make the whole && chain fail
# and always select the default.
my $columns = `which tput >/dev/null 2>/dev/null && tput cols 2>/dev/null`;
if (!$? && defined($columns) && $columns =~ /^\s*(\d+)\s*$/ && $1 > 0) {
    # strip the trailing line break and any padding
    $columns = $1;
} else {
    $columns = 80;
}
|
|
|
|
|
|
|
|
# Dispatch on the number of command line arguments:
# - more than two: print usage and exit with 1
# - exactly two:   normalize both files and print a side-by-side diff of
#                  the records which differ; exit code is 0 if nothing
#                  differs, otherwise CLIENT_TEST_COMPARISON_FAILED or 1
# - one or none:   normalize the file (or stdin) and print it to stdout
if ($#ARGV > 1) {
    # error
    Usage();
    exit 1;
} elsif ($#ARGV == 1) {
    # comparison

    my ($file1, $file2) = ($ARGV[0], $ARGV[1]);

    open(my $in1, "<:utf8", $file1) || die "$file1: $!";
    open(my $in2, "<:utf8", $file2) || die "$file2: $!";
    # two columns of equal width plus three characters for the separator
    my $singlewidth = int(($columns - 3) / 2);
    $columns = $singlewidth * 2 + 3;
    my @normal1 = Normalize($in1, $singlewidth);
    my @normal2 = Normalize($in2, $singlewidth);
    close($in1);
    close($in2);

    # Produce output where each line is marked as old (aka remove) with o,
    # as new (aka added) with n, and as unchanged with u at the beginning.
    # This allows simpler processing below.
    my $res = 0;
    my @marked = ();
    my $diffs_ref = Algorithm::Diff::sdiff(\@normal1, \@normal2);
    foreach my $hunk ( @{$diffs_ref} ) {
        my ($type, $left, $right) = @{$hunk};
        if ($type eq "-") {
            push @marked, "o $left";
            $res = 1;
        } elsif ($type eq "+") {
            push @marked, "n $right";
            $res = 1;
        } elsif ($type eq "c") {
            push @marked, "o $left";
            push @marked, "n $right";
            $res = 1;
        } else {
            push @marked, "u $left";
        }
    }
    my $diff = join("\n", @marked);

    if ($res) {
        # legend
        printf "%*s | %s\n", $singlewidth,
               ($ENV{CLIENT_TEST_LEFT_NAME} || "before sync"),
               ($ENV{CLIENT_TEST_RIGHT_NAME} || "after sync");
        printf "%*s <\n", $singlewidth,
               ($ENV{CLIENT_TEST_REMOVED} || "removed during sync");
        printf "%*s > %s\n", $singlewidth, "",
               ($ENV{CLIENT_TEST_ADDED} || "added during sync");
        print "-" x $columns, "\n";

        # A new record which was added in front of an unchanged one can
        # be reported with the BEGIN line of the unchanged record as
        # common line. With the o/n/u markup this presents itself as:
        #   u BEGIN:VCARD
        #   n N:new;entry
        #   n FN:new
        #   n END:VCARD
        #   n
        #   n BEGIN:VCARD
        # which is confusing. Move the "u" marker down to the second
        # BEGIN so that the added record is marked completely as new:
        #   n BEGIN:VCARD
        #   n N:new;entry
        #   n FN:new
        #   n END:VCARD
        #   n
        #   u BEGIN:VCARD
        #
        # The alternative case is also possible:
        #   o END:VCARD
        #   o
        #   o BEGIN:VCARD
        #   o N:old;entry
        #   u END:VCARD

        # case one above
        1 while $diff =~ s/^u BEGIN:(VCARD|VCALENDAR)\n((?:^n .*\n)+?)^n BEGIN:/n BEGIN:$1\n$2u BEGIN:/m;
        # same for the other direction
        1 while $diff =~ s/^u BEGIN:(VCARD|VCALENDAR)\n((?:^o .*\n)+?)^o BEGIN:/o BEGIN:$1\n$2u BEGIN:/m;

        # case two
        1 while $diff =~ s/^o END:(VCARD|VCALENDAR)\n((?:^o .*\n)+?)^u END:/u END:$1\n$2o END:/m;
        1 while $diff =~ s/^n END:(VCARD|VCALENDAR)\n((?:^n .*\n)+?)^u END:/u END:$1\n$2n END:/m;

        # split at end of each record
        my $spaces = " " x $singlewidth;
        foreach my $record (split /(?:(?<=. END:VCARD\n)|(?<=. END:VCALENDAR\n))(?:^. \n)*/m, $diff) {
            # ignore unchanged records
            next if !length($record) || $record =~ /^((u [^\n]*\n)*(u [^\n]*?))$/s;

            # make all lines equally long in terms of printable characters
            # (marker and blank plus $singlewidth characters of content)
            $record =~ s/^(.*)$/$1 . (" " x ($singlewidth + 2 - length($1)))/gme;

            # convert into side-by-side output
            my @buffer = ();
            foreach my $line (split /\n/, $record) {
                if ($line =~ /^u (.*)/) {
                    print join(" <\n", @buffer), " <\n" if $#buffer >= 0;
                    @buffer = ();
                    # three blanks: same width as the " | " and " > "
                    # separators, so that the right column stays aligned
                    print $1, "   ", $1, "\n";
                } elsif ($line =~ /^o (.*)/) {
                    # preserve in buffer for potential merging with "n "
                    push @buffer, $1;
                } else {
                    $line =~ /^n (.*)/;
                    # have line to be merged with?
                    if ($#buffer >= 0) {
                        print shift(@buffer), " | ", $1, "\n";
                    } else {
                        print $spaces, " > ", $1, "\n";
                    }
                }
            }
            # removed lines which had no counterpart on the right side
            print join(" <\n", @buffer), " <\n" if $#buffer >= 0;
            @buffer = ();

            print "-" x $columns, "\n";
        }
    }

    exit($res ? ((defined $ENV{CLIENT_TEST_COMPARISON_FAILED}) ? int($ENV{CLIENT_TEST_COMPARISON_FAILED}) : 1) : 0);
} else {
    # normalize
    my $in;
    if ($#ARGV >= 0) {
        # three-argument open: the file name is never interpreted as
        # mode or command, and the file is decoded as UTF-8 exactly
        # as in comparison mode
        open($in, "<:utf8", $ARGV[0]) || die "$ARGV[0]: $!";
    } else {
        $in = *STDIN{IO};
    }

    print STDOUT join("\n", Normalize($in, $columns)), "\n";
}
|