# Module of TWiki Enterprise Collaboration Platform, http://TWiki.org/
#
# Changes copyright (C) 2005 Sven Dowideit http://www.home.org.au
# Copyright (C) 2004-2006 TWiki Contributors. All Rights Reserved. 
# TWiki Contributors are listed in the AUTHORS file in the root of 
# this distribution. NOTE: Please extend that file, not this notice.
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version. For
# more details read LICENSE in the root of this distribution.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
#
# As per the GPL, removal of this notice is prohibited.
#
# Support functionality for TWiki
#
# Jul 2004 - copied almost completely from Sven's updateTopics.pl script:
#            put in a package and made a subroutine to work with UpgradeTWiki 
#             by Martin "GreenAsJade" Gregory.


package TWiki::Upgrade::UpdateTopics;

use strict;

use TWiki::Upgrade;
use File::Find;
use File::Copy;
use File::Basename;
use Text::Diff;

# Try to upgrade an installation's TWikiTopics using the rcs info in it.

use vars qw($CurrentDataDir $NewReleaseDataDir $DestinationDataDir $debug $RcsLogFile $TempDir $upgradeObj);
#					@DefaultWebTopics %LinkedDirPathsInWiki);

sub UpdateTopics 
{
	$debug = 0;	#Set if you want to see the debug output
	$upgradeObj = shift;
    $NewReleaseDataDir = shift or die "UpdateTopics not provided with new data directory!\n";
    $CurrentDataDir = shift or die "UpdateTopics not provided with existing data directory!\n";
    $DestinationDataDir = shift or die "DestinationDataDir not provided\n";

    mkdir( $DestinationDataDir, 0777);
    $TempDir = "$DestinationDataDir/tmp";
    while (-d $TempDir ) { $TempDir .= 'p' }   # we want our own previously non-existing directory!
    mkdir( $TempDir, 0777) or die "Uhoh - couldn't make a temporary directory called $TempDir: $!\n";

    $upgradeObj->writeToLogAndScreen("\n---\n$NewReleaseDataDir , $CurrentDataDir , $DestinationDataDir\n----\n");

    my $whoCares = `which rcsdiff`;   # we should use File::Which to do this, except that would mean
                                      # getting yet another .pm into lib, which seems like hard work?
    ($? >> 8 == 0) or die "Uh-oh - couldn't see an rcs executable on your path!  I really need one of those!\n";

    $whoCares = `which patch`;
    ($? >> 8 == 0) or die "Uh-oh - couldn't see a patch executable on your path!  I really need one of those!\n";

    $upgradeObj->writeToLogAndScreen("\n");
    $upgradeObj->writeToLogAndScreen("\t...new upgraded data will be put in $DestinationDataDir\n");
    $upgradeObj->writeToLogAndScreen("\t   there will be no changes made to either the source data directory or $NewReleaseDataDir.\n\n"); 
    $upgradeObj->writeToLogAndScreen("\t This progam will attempt to use the rcs versioning information to upgrade the\n");
    $upgradeObj->writeToLogAndScreen("\t   contents of your distributed topics in $CurrentDataDir to the content in $NewReleaseDataDir.\n\n");
    $upgradeObj->writeToLogAndScreen("Output:\n");
    $upgradeObj->writeToLogAndScreen("\tFor each file that has no versioning information in your existing twiki a _v_ will be printed\n");
    $upgradeObj->writeToLogAndScreen("\tFor each file that has no changes from the previous release a _c_ will be printed\n");
    $upgradeObj->writeToLogAndScreen("\tFor each file that has no changes made in your existing release, a _u_ will be printed (new version is copied)\n");
    $upgradeObj->writeToLogAndScreen("\tFor each file where no commonality could be found, your existing one is used, and a _C_ will be printed\n");
    $upgradeObj->writeToLogAndScreen("\tFor each file that has changes and a patch is generated a _p_ will be printed\n");
    $upgradeObj->writeToLogAndScreen("\tFor each file that is new in the NewReleaseDataDir a _+_ will be printed\n");
    $upgradeObj->writeToLogAndScreen("\t When the script has attempted to patch the $NewReleaseDataDir, 
\t *.rej files will contain the failed merges\n");
    $upgradeObj->writeToLogAndScreen("\t although many of these rejected chages will be discardable, 
\t please check them to see if your configuration is still ok\n\n");


	#redirect stderr into a file (rcs dumps out heaps of info)
    $RcsLogFile = $DestinationDataDir."/rcs.log";
    unlink($RcsLogFile);  # let's have just the messages from this session!

    open(PATCH, "> $DestinationDataDir/patchTopics");
    
    $upgradeObj->writeToLogAndScreen("\n\n ...checking existing files from $CurrentDataDir\n");
#TODO: need to find a way to detect non-Web directories so we don't make a mess of them..
# (should i just ignore Dirs without any ,v files?) - i can't upgrade them anyway..
#upgrade templates..?

    my %findOptions;

    $findOptions{'wanted'} = \&getRLog;
    $findOptions{'follow_fast'} = 1;   # surely the user hasn't put loops of links etc in their data!?

    find(\%findOptions, $CurrentDataDir);

    close(PATCH);

#do a find through $NewReleaseDataDir and copy all missing files & dirs
    $upgradeObj->writeToLogAndScreen("\n\n ... checking for new files in $NewReleaseDataDir");
    find(\&copyNewTopics, $NewReleaseDataDir);
    
#run `patch patchTopics` in $DestinationDataDir
    $upgradeObj->writeToLogAndScreen("\nPatching topics (manually check the rejected patch (.rej) files)");
    chdir($DestinationDataDir);
    `patch -p0 < patchTopics > patch.log`;
#TODO: examing the .rej files to remove the ones that have already been applied
    find(\&listRejects, ".");
#TODO: run `ci` in $DestinationDataDir
    
    $upgradeObj->writeToLogAndScreen("\n\n");
    
    # fix up permissions ... get them to a working state, if not ideal seurity-wise!
	# (we tell the user to check the permissions later anyhow)
	$upgradeObj->writeToLogAndScreen("
		Now I'm giving everyone write access to $DestinationDataDir, 
		so your web server user can access them.
		");
	find( sub {chmod 0777, $File::Find::name;} , $DestinationDataDir);
    
    rmdir($TempDir);
}
    
# ============================================
sub listRejects
{
    my ( $filename ) = @_;
    
    $filename = $File::Find::name;

    if ($filename =~ /.rej$/ ) {
        $upgradeObj->writeToLogAndScreen("\nPatch rejected: $filename");
    }
}

# ============================================
sub copyNewTopics
{
    my ( $filename ) = $File::Find::name;

    my $destinationFilename = $filename;
    $destinationFilename =~ s/$NewReleaseDataDir/$DestinationDataDir/g;

# Sven had these commeted out, so I've left them here commented out.
#    return if $filename =~ /,v$/;
#    return if $filename =~ /.lock$/;
#    return if $filename =~ /~$/;
	return if $filename =~ /\.svn.*/;	#don't follow into .svn dirs

    if ( -d $filename) {
        $upgradeObj->writeToLogAndScreen("\nprocessing directory $filename");
		if ( !-d $destinationFilename ) {
	    	$upgradeObj->writeToLogAndScreen(" (creating $destinationFilename)");
	    	mkdir($destinationFilename, 0777);
		}
        return;
    }
    
    if (! -e $destinationFilename ) { 
        $upgradeObj->writeToLog("\nadding $filename (new in this release)");
        $upgradeObj->writeToScreen('+');
        copy( $filename, $destinationFilename);
    }
    
}

# ============================================
sub getRLog
{
    my ( $filename ) = $File::Find::name;

	if ($filename =~ /\.rej$/) {		#don't copy reject files from upgrade 
		#SMELL: this is going to be bad if someone has attached a .rej file...
		$upgradeObj->writeToLog("\nfound rejected patch file from previous upgrade ($filename) - not copying it");
		return;
	}

    my ( $newFilename ) = $filename;
    if (!$filename =~ /^$CurrentDataDir/)
    {
		die "getRLog found $filename that appears not to be in $CurrentDataDir tree! That's not supposed to happen: sorry!\n";
    }
	
    $newFilename =~ s/$CurrentDataDir/$NewReleaseDataDir/g;

    my $destinationFilename = $filename;
    $destinationFilename =~ s/$CurrentDataDir/$DestinationDataDir/g;

    if ($filename =~ /,v$/ or $filename =~ /.lock$/ or $filename =~ /~$/) {
		#$upgradeObj->writeToLog("skipping ($filename)\n");
		return;
    }

    $upgradeObj->writeToLog("\n$filename -> $newFilename : ");

    if ( -d $filename ) {
	$upgradeObj->writeToLogAndScreen("\nprocessing directory (creating $destinationFilename)\n");
        mkdir($destinationFilename, 0777);
        return;
    }
    
#    if ( isFromDefaultWeb($filename) )
#    {
#        $newFilename =~ s|^(.*)/[^/]*/([^/]*)|$1/_default/$2|g;
#        $upgradeObj->writeToLogAndScreen("\n$filename appears to have been generated from from _default - merging with $newFilename from the new distribution" if ($debug);
#    }
    
    if (! -e $filename.",v" )
    {
        if ( $filename =~ /.txt$/ ) {
	    # here we defer making an RCS file for this file to someone else :-)
	    # (probably the process that checks all the new wiki files back in)
            $upgradeObj->writeToLog("\nWarning: $filename does not have any rcs information");
            $upgradeObj->writeToScreen("v");
        }
        copy( $filename, $destinationFilename);
        return;
    }

    # make it easy for debugging to turn on or off the business about
    # checking in the existing files before rcsdiffing them
    # this is necessary, because you have to make changes in two places to make
    # this switch, and if you forget the second one you're gunna delete lots of files
    # you wanted to keep!

    my $doCiCo = 1;
#   my $doCiCo = 0;

    # Now - the main business: if we're looking at a file that has a new version in
    # the new distribution then we have to try merging etc...

    if ( -e $newFilename ) { 
        # file that may need upgrading

	my $workingFilename;

	if (!$doCiCo)
	{
	    $workingFilename = $filename;
	}
	else
	{
	    $workingFilename = "$TempDir/". basename($filename);
	    
	    $upgradeObj->writeToLog("\nWorking file: $workingFilename");
	    
	    copy ( $filename, $workingFilename)
		or die "Couldn't make copy of $filename at $workingFilename: $!\n";

	    copy ( "$filename,v", "$workingFilename,v")
		or die "Couldn't make copy of $filename,v at $workingFilename,v: $!\n";
	    
	    # This procedure copied from UI::Manage.pm
	    # could be perhaps performed in less steps, but who cares...
	    # break lock
	    system("rcs -q -u -M $workingFilename 2>>$RcsLogFile");
	    # relock
	    system("rcs -q -l $workingFilename 2>>$RcsLogFile");
	    # check outstanding changes in (note that -t- option should never be used, but it's there for completeness,
	    #  and since it was in Manage.pm)
	    system("ci -u -mUpdateTopics -t-missing_v $workingFilename 2>>$RcsLogFile");
	}

    my $highestCommonRevision = findHighestCommonRevision( $workingFilename, $newFilename);

	# is it the final version of $filename? 
	# (in which case:
#TODO: what about manually updated files?


#TODO: need to do something different if we are upgrading from a beta to the release
    if ( $highestCommonRevision =~ /\d*\.\d*/ ) 
	{
        my $diff = doDiffToHead( $workingFilename, $highestCommonRevision );

	    $diff = removeVersionChangeDiff($diff);
        patchFile( $filename, $destinationFilename, $diff );

            $upgradeObj->writeToLog("\ncreating a patch for $newFilename from $filename ($highestCommonRevision)");
            $upgradeObj->writeToScreen("p");
            copy( $newFilename, $destinationFilename);
            copy( $newFilename.",v", $destinationFilename.",v");
    } elsif ($highestCommonRevision eq "head" ) {
	    # This uses the existing file rather than the new one, in case they manually
	    # changed the exisiting one without using RCS.
            $upgradeObj->writeToLog("\nhighest common revision is final revision in oldTopic (using new Version)");
            $upgradeObj->writeToScreen("u");
            copy( $newFilename, $destinationFilename);
            copy( $newFilename.",v", $destinationFilename.",v");
    } else {
            #no common versions - this might be a user created file, 
            #or a manual attempt at creating a topic off twiki.org?raw=on
#TODO: do something nicer about this.. I think i need to do lots of diffs 
            #to see if there is any commonality
            $upgradeObj->writeToLog("\nWarning: copying $filename (no common versions)");
            $upgradeObj->writeToScreen("C");
            copy( $filename, $destinationFilename);
            copy( $filename.",v", $destinationFilename.",v");
    }

	if ( $doCiCo )
	{
	    unlink ($workingFilename, "$workingFilename,v") or
		warn "Couldn't remove temporary files $workingFilename, $workingFilename,v: $! Could be trouble ahead...\n";
	}

    } else {
        #new file created by users
#TODO: this will include topics copied using ManagingWebs (createWeb)
        $upgradeObj->writeToLog("\ncopying $filename (user's existing file)");
        $upgradeObj->writeToScreen("c");
        copy( $filename, $destinationFilename);
        copy( $filename.",v", $destinationFilename.",v");
    }
}

# ==============================================
sub isFromDefaultWeb
{
    my ($filename) = @_;

    opendir(DEFAULTWEB, './data/_default') or die "Yikes - couldn't open ./data/_default: $! ... not safe to proceed!\n";
    my @DefaultWebTopics = grep(/.txt$/, readdir(DEFAULTWEB));
    if ($debug) { $upgradeObj->writeToLogAndScreen("_default topics in new distro: @DefaultWebTopics\n"); }

    my $topic = basename($filename);
    return $topic if grep(/^$topic$/, @DefaultWebTopics);
}

# ==============================================
sub doDiffToHead
{
    my ( $filename, $highestCommonRevision ) = @_;
   
#    $upgradeObj->writeToLogAndScreen("$highestCommonRevision to ".getHeadRevisionNumber($filename)."\n");
#    $upgradeObj->writeToLogAndScreen("\n----------------\n".getRevision($filename, $highestCommonRevision));
#     $upgradeObj->writeToLogAndScreen("\n----------------\n".getRevision($filename, getHeadRevisionNumber($filename))) ;
#    return diff ( getRevision($filename, $highestCommonRevision), getRevision($filename, getHeadRevisionNumber($filename)) ));

    my $cmd = "rcsdiff -r".$highestCommonRevision." -r".getHeadRevisionNumber($filename)." $filename";
    $upgradeObj->writeToLogAndScreen("\n----------------\n".$cmd)  if ($debug);
    my $diffs =  `$cmd 2>>$RcsLogFile`;
    return $diffs;
}

# ==============================================
sub patchFile
{
    my ( $oldFilename, $destinationFilename, $diff ) = @_;


    # Here's where we do a total hack to get WIKIWEBLIST right.  
    # we have to check every stinkin line of diff just to intercept this one :-(

    my @diff;

    @diff = split(/\r?\n/, $diff);

    my $i;

    for($i = 0; $i < @diff ; $i++)
    {
		if ($diff[$i] =~ m/<\s*\* Set WIKIWEBLIST = /)
		{
		    # come to mama
		    # this had better be the value in the distribution!...
		    $diff[$i] = '< 		* Set WIKIWEBLIST = [[%MAINWEB%.%HOMETOPIC%][%MAINWEB%]] %SEP% [[%TWIKIWEB%.%HOMETOPIC%][%TWIKIWEB%]] %SEP% [[Sandbox.%HOMETOPIC%][Sandbox]]';
		    last;
		}
    }
    
    $diff = join("\n", @diff);

    # this looks odd: it's just telling patch to apply the patch to $destinationFilename
    # perhaps only one file name line would do, but better safe than sorry!    
    # (diffs always seem to have two lines)
    print(PATCH "--- $destinationFilename\n");
    print(PATCH "--- $destinationFilename\n");

    print(PATCH "$diff\n");

#    print(PATCH, "");
    
    #patch ($newFilename, $diff);
# and then do an rcs ci (check-in)
}

# ==============================================
sub getHeadRevisionNumber
{
    my ( $filename ) = @_;
    
    my ( $cmd ) = "rlog ".$filename.",v";

    my $line;

    my @response = `$cmd 2>>$RcsLogFile`;
    foreach $line (@response) {
        next unless $line =~ /^head: (\d*\.\d*)/;
        return $1;
    }
    return "";    
}

# ==============================================
#returns, as a string, the highest revision number common to both files
#Note: we return nothing if the highestcommon verison is also the last version of $filename
#TODO: are teh rcs versions always 1.xxx ? if not, how do we know?
sub findHighestCommonRevision 
{
    my ( $filename, $newFilename) = @_;
    
    my $rev = 1;
    my $commonRev = "";

    my $oldContent = "qwer";
    my $newContent = "qwer";
    while ( ( $oldContent ne "" ) & ($newContent ne "") ) {
        $upgradeObj->writeToLog("\ncomparing $filename and $newFilename revision 1.$rev ");
        $oldContent = getRevision( $filename, "1.".$rev);
        $newContent = getRevision( $newFilename, "1.".$rev);
        if ( ( $oldContent ne "" ) & ($newContent ne "") ) {
            my $diffs = diff( \$oldContent, \$newContent, {STYLE => "Unified"} );
#            $upgradeObj->writeToLogAndScreen("\n-----------------------|".$diffs."|-------------------\n");
#            $upgradeObj->writeToLogAndScreen("\n-------------------[".$oldContent."]----|".$diffs."|-------[".$newContent."]--------------\n");
            if ( $diffs eq "" ) {
                #same!!
                $commonRev = "1.".$rev;
            }
        }
        $rev = $rev + 1;
    }

    $upgradeObj->writeToLog("\nlastCommon = $commonRev (head = ".getHeadRevisionNumber( $filename).")");
    
    if ( $commonRev eq getHeadRevisionNumber( $filename) ) {
        return "head";
    }
    
    return $commonRev;
}

# ==============================================
#returns an empty string if the version does not exist
sub getRevision
{
    my ( $filename, $rev ) = @_;

# use rlog to test if the revision exists..
    my ( $cmd ) = "rlog -r".$rev." ".$filename;

#$upgradeObj->writeToLogAndScreen($cmd."\n");
    my @response = `$cmd 2>>$RcsLogFile`;

    my $revision;
    my $line;
    foreach $line (@response) {
        next unless $line =~ /^revision (\d*\.\d*)/;
        $revision = $1;
    }

    my $content = "";

    if ( $revision and ($revision eq $rev) ) {
        $cmd = "co -p".$rev." ".$filename;
        $content = `$cmd 2>>$RcsLogFile`;
    }

    return $content;
}

# $diff is assumed to contain the diff between two similar TWiki topics
# TWiki topics should, as a rule, differ in the first line with respect to
# their version number.   This routine gets rid of that component of the diff.
# It could be more rigorous (like testing if the 1c1 change relates to %META).
# The diff is assumed not to contain the preamble.

sub removeVersionChangeDiff
{
    my ($diff) = @_;

    my @diff = split( /\r?\n/, $diff);

    if ($diff[0] eq '1c1')
    {
	splice(@diff, 0, 4);
    }

    $diff = join "\n", @diff;

#    $upgradeObj->writeToLogAndScreen("rVCD returning: \n$diff\n");

    return $diff;
}
    
1;
