v50 Steam/Premium information for editors
  • v50 information can now be added to pages in the main namespace. v0.47 information can still be found in the DF2014 namespace. See here for more details on the new versioning policy.
  • Use this page to report any issues related to the migration.
This notice may be cached—the current version can be found here.

Difference between revisions of "User:Quietust/rawextract.pl"

From Dwarf Fortress Wiki
Jump to navigation Jump to search
m (add 0.43.01)
m (add versions up thru 0.43.05)
Line 77: Line 77:
  
 
1551, '0.43.01',
 
1551, '0.43.01',
 +
1552, '0.43.02',
 +
1553, '0.43.03',
 +
1555, '0.43.04',
 +
1556, '0.43.05',
 
);
 
);
  
Line 125: Line 129:
 
$version = readLong($raw);
 
$version = readLong($raw);
 
if (exists($versions{$version})) { print "World is from version $versions{$version}\n"; }
 
if (exists($versions{$version})) { print "World is from version $versions{$version}\n"; }
else { print "World is from an unrecognized version!\n"; }
+
else { print "World is from an unrecognized version '$version'!\n"; }
 
my $comp = readLong($raw);
 
my $comp = readLong($raw);
 
if ($comp == 1) { $raw = decompress($version, $raw); }
 
if ($comp == 1) { $raw = decompress($version, $raw); }
Line 152: Line 156:
 
$version = readLong($raw);
 
$version = readLong($raw);
 
if (exists($versions{$version})) { print "World is from version $versions{$version}\n"; }
 
if (exists($versions{$version})) { print "World is from version $versions{$version}\n"; }
else { print "World is from an unrecognized version!\n"; }
+
else { print "World is from an unrecognized version '$version'!\n"; }
 
my $comp = readLong($raw);
 
my $comp = readLong($raw);
 
if ($comp == 1) { $raw = decompress($version, $raw); }
 
if ($comp == 1) { $raw = decompress($version, $raw); }

Revision as of 01:24, 4 January 2017

#!/usr/bin/env perl

use strict;

use File::Temp qw/tempfile/;
use Compress::Zlib;

# Maps the version number stored at the start of a save file to the
# release it identifies, grouped by release series.
my %versions = (
	# 0.31.x
	1287 => '0.31.01',
	1288 => '0.31.02',
	1289 => '0.31.03',
	1292 => '0.31.04',
	1295 => '0.31.05',
	1297 => '0.31.06',
	1300 => '0.31.08',
	1304 => '0.31.09',
	1305 => '0.31.10',
	1310 => '0.31.11',
	1311 => '0.31.12',
	1323 => '0.31.13',
	1325 => '0.31.14',
	1326 => '0.31.15',
	1327 => '0.31.16',
	1340 => '0.31.17',
	1341 => '0.31.18',
	1351 => '0.31.19',
	1353 => '0.31.20',
	1354 => '0.31.21',
	1359 => '0.31.22',
	1360 => '0.31.23',
	1361 => '0.31.24',
	1362 => '0.31.25',

	# 0.34.x
	1372 => '0.34.01',
	1374 => '0.34.02',
	1376 => '0.34.03',
	1377 => '0.34.04',
	1378 => '0.34.05',
	1382 => '0.34.06',
	1383 => '0.34.07',
	1400 => '0.34.08',
	1402 => '0.34.09',
	1403 => '0.34.10',
	1404 => '0.34.11',

	# 0.40.x
	1441 => '0.40.01',
	1442 => '0.40.02',
	1443 => '0.40.03',
	1444 => '0.40.04',
	1445 => '0.40.05',
	1446 => '0.40.06',
	1448 => '0.40.07',
	1449 => '0.40.08',
	1451 => '0.40.09',
	1452 => '0.40.10',
	1456 => '0.40.11',
	1459 => '0.40.12',
	1462 => '0.40.13',
	1469 => '0.40.14',
	1470 => '0.40.15',
	1471 => '0.40.16',
	1472 => '0.40.17',
	1473 => '0.40.18',
	1474 => '0.40.19',
	1477 => '0.40.20',
	1478 => '0.40.21',
	1479 => '0.40.22',
	1480 => '0.40.23',
	1481 => '0.40.24',

	# 0.42.x
	1531 => '0.42.01',
	1532 => '0.42.02',
	1533 => '0.42.03',
	1534 => '0.42.04',
	1537 => '0.42.05',
	1542 => '0.42.06',

	# 0.43.x
	1551 => '0.43.01',
	1552 => '0.43.02',
	1553 => '0.43.03',
	1555 => '0.43.04',
	1556 => '0.43.05',
);

# Expand a compressed save file into a temporary file.
#
# Arguments:
#   $version - version number to write into the header of the expanded copy
#   $file    - input filehandle, positioned at the first length-prefixed block
#
# The input is consumed as a sequence of blocks, each a 32-bit little-endian
# length followed by that many bytes of zlib-compressed data.
#
# Returns a handle on the temporary file, positioned 8 bytes in (just past
# the header written here). The input handle is closed.
# Dies if a block is shorter than its declared length or cannot be inflated.
sub decompress {
	my ($version, $file) = @_;
	my $out = tempfile();
	binmode($out);

	# write 'uncompressed' header
	print {$out} pack('VV', $version, 0);

	while (1) {
		my $len = readLong($file);
		# Running out of input while reading a length is the normal exit.
		last if !defined($len) || eof($file);

		my $got = read($file, my $block, $len);
		if (!defined($got) || $got != $len) {
			die("Compressed block is truncated (expected $len bytes)!");
		}

		# uncompress() returns undef on failure; writing that out would
		# silently drop data and misalign everything read afterwards.
		my $data = uncompress($block);
		if (!defined($data)) {
			die("Could not decompress block - file is corrupted!");
		}
		print {$out} $data;
	}
	seek($out, 8, 0);
	close($file);
	return $out;
}

# Read 4 bytes from the given filehandle and decode them as an unsigned
# 32-bit little-endian integer.
sub readLong {
	my ($fh) = @_;
	my $bytes;
	read($fh, $bytes, 4);
	return unpack('V', $bytes);
}

# Read 2 bytes from the given filehandle and decode them as an unsigned
# 16-bit little-endian integer.
sub readShort {
	my ($fh) = @_;
	my $bytes;
	read($fh, $bytes, 2);
	return unpack('v', $bytes);
}

# Read a single byte from the given filehandle and return it as an
# unsigned integer.
sub readByte {
	my ($fh) = @_;
	my $bytes;
	read($fh, $bytes, 1);
	return unpack('C', $bytes);
}

# Locate and open the save file, report its version, and advance the input
# handle to the point where the lists of generated raws begin.

# Optional first command-line argument: a directory, used as a path prefix.
my $dir = '';
if (@ARGV > 0) { $dir = $ARGV[0] .'/'; }
# Overwritten with the version number read from the file header.
my $version = -1;
# Input handle; replaced by a temporary-file handle if the file is compressed.
my $raw;

# world.dat is tried first; world.sav is only tried if it cannot be opened.
if (open($raw, '<', $dir.'world.dat')) {
	binmode($raw);
	# Header: 32-bit version number, then a 32-bit compression flag.
	$version = readLong($raw);
	if (exists($versions{$version})) { print "World is from version $versions{$version}\n"; }
	else { print "World is from an unrecognized version '$version'!\n"; }
	# Flag 1 = compressed, 0 = read as-is; any other value is rejected.
	my $comp = readLong($raw);
	if ($comp == 1) { $raw = decompress($version, $raw); }
	elsif ($comp > 0) { die("world.dat file is corrupted!"); }

	# Skip forward (relative seeks) over data that is not needed here. The
	# thresholds add extra bytes for newer versions, and the steps are
	# cumulative.
	# NOTE(review): the meaning of the skipped fields is not visible in this
	# script - confirm against the save format before changing any offset.
	seek($raw, 0x46, 1);
	if ($version >= 1372) { seek($raw, 0x14, 1); }
	if ($version >= 1400) { seek($raw, 0x4, 1); }
	if ($version >= 1441) { seek($raw, 0x14, 1); }
	if ($version >= 1531) { seek($raw, 0x18, 1); }
	# A non-zero flag byte is followed by two length-prefixed fields and
	# 0x30 further bytes, all of which are skipped.
	if (readByte($raw)) {
		seek($raw, readShort($raw), 1);
		seek($raw, readShort($raw), 1);
		seek($raw, 0x30, 1);
	}
	seek($raw, 0xF, 1);

	# Length-prefixed string: printed below as the world's name.
	my $len = readShort($raw);
	read($raw, my $world, $len);
	print "Extracting randomly generated raws of $world:\n\n";
}
elsif (open($raw, '<', $dir.'world.sav'))
{
	binmode($raw);

	# Same header layout as above: version number, then compression flag.
	$version = readLong($raw);
	if (exists($versions{$version})) { print "World is from version $versions{$version}\n"; }
	else { print "World is from an unrecognized version '$version'!\n"; }
	my $comp = readLong($raw);
	if ($comp == 1) { $raw = decompress($version, $raw); }
	elsif ($comp > 0) { die("world.sav file is corrupted!"); }

	# Same version-dependent skips as for world.dat, but starting from a
	# larger fixed offset (0x56 rather than 0x46) and without the optional
	# flag-controlled section.
	seek($raw, 0x56, 1);
	if ($version >= 1372) { seek($raw, 0x14, 1); }
	if ($version >= 1400) { seek($raw, 0x4, 1); }
	if ($version >= 1441) { seek($raw, 0x14, 1); }
	if ($version >= 1531) { seek($raw, 0x18, 1); }

	# First length-prefixed string is read only to move past it; $name is
	# not used afterwards.
	my $len = readShort($raw);
	read($raw, my $name, $len);

	# Second length-prefixed string: printed below as the world's name.
	$len = readShort($raw);
	read($raw, my $world, $len);
	print "Extracting randomly generated raws of $world:\n\n";
	readLong($raw); # year
}
else { die("Could not open world.dat or world.sav!"); }

# Read one list of raw definitions from the input and write each definition
# to its own text file in the current directory.
#
# Arguments:
#   $raw   - input filehandle, positioned at the list's 32-bit entry count
#   $type  - label used in progress messages and in fallback file names
#   $token - regular-expression fragment matching the tag that names a
#            definition, e.g. 'CREATURE' or 'ITEM_.*?'
#
# Each entry is a 32-bit line count followed by that many length-prefixed
# strings. The output file is named after the last "[TOKEN:name]" tag found
# in the entry, or "<type>_<index>" when no such tag is present.
#
# Dies if the input ends before all announced entries have been read.
# A file that cannot be written is reported with a warning and skipped.
sub extractList {
	my ($raw, $type, $token) = @_;

	my $count = readLong($raw);
	print "Extracting $count $type definitions...\n";

	for (my $i = 0; $i < $count; $i++) {
		# Every entry needs at least its line count, so running out of
		# input here means the count was bogus or the file is truncated.
		# Without this check a garbage count produces a flood of
		# placeholder files.
		if (eof($raw)) {
			die("Unexpected end of file while reading $type definitions!");
		}

		my $data = '';
		my $file = $type.'_'.$i;
		my $numLines = readLong($raw);
		for (my $j = 0; $j < $numLines; $j++) {
			my $len = readShort($raw);
			read($raw, my $str, $len);
			$data .= "$str\n";
			# $token is deliberately interpolated as a pattern, not a literal.
			if ($str =~ /\[$token:(.*?)\]/) { $file = $1; }
		}
		print "$file...\n";

		# NOTE(review): the file name comes straight from the save data and
		# is not sanitised; consider rejecting path separators if saves from
		# untrusted sources are ever processed.
		my $path = $file.'.txt';
		my $out;
		if (!open($out, '>', $path)) {
			warn("Could not open $path for writing: $!\n");
			next;
		}
		print {$out} $data;
		close($out) or warn("Could not finish writing $path: $!\n");
	}
}

# The lists of generated raws, in the order they are read from the file.
# Each entry is [minimum version, type label, token pattern]; an undefined
# minimum means the list is read regardless of version.
my @rawLists = (
	[1372,  'material',    'INORGANIC'],
	[1441,  'plant',       'PLANT'],
	[1400,  'item',        'ITEM_.*?'],
	[undef, 'creature',    'CREATURE'],
	[1441,  'entity',      'ENTITY'],
	[1531,  'reaction',    'REACTION'],
	[1372,  'interaction', 'INTERACTION'],
	[1441,  'language',    'TRANSLATION'],
);

foreach my $entry (@rawLists) {
	my ($minVersion, $type, $token) = @$entry;
	next if defined($minVersion) && $version < $minVersion;
	extractList($raw, $type, $token);
}

print "done!\n";