v50 Steam/Premium information for editors
  • v50 information can now be added to pages in the main namespace. v0.47 information can still be found in the DF2014 namespace. See here for more details on the new versioning policy.
  • Use this page to report any issues related to the migration.
This notice may be cached—the current version can be found here.

Difference between revisions of "User:Quietust/rawextract.php"

From Dwarf Fortress Wiki
Jump to navigation Jump to search
m (add newer versions)
 
(20 intermediate revisions by 2 users not shown)
Line 1: Line 1:
  <nowiki><?
+
  <nowiki><?php
 
$versions = array(
 
$versions = array(
 
1287 => '0.31.01',
 
1287 => '0.31.01',
Line 43: Line 43:
 
1444 => '0.40.04',
 
1444 => '0.40.04',
 
1445 => '0.40.05',
 
1445 => '0.40.05',
 +
1446 => '0.40.06',
 +
1448 => '0.40.07',
 +
1449 => '0.40.08',
 +
1451 => '0.40.09',
 +
1452 => '0.40.10',
 +
1456 => '0.40.11',
 +
1459 => '0.40.12',
 +
1462 => '0.40.13',
 +
1469 => '0.40.14',
 +
1470 => '0.40.15',
 +
1471 => '0.40.16',
 +
1472 => '0.40.17',
 +
1473 => '0.40.18',
 +
1474 => '0.40.19',
 +
1477 => '0.40.20',
 +
1478 => '0.40.21',
 +
1479 => '0.40.22',
 +
1480 => '0.40.23',
 +
1481 => '0.40.24',
 +
 +
1531 => '0.42.01',
 +
1532 => '0.42.02',
 +
1533 => '0.42.03',
 +
1534 => '0.42.04',
 +
1537 => '0.42.05',
 +
1542 => '0.42.06',
 +
 +
1551 => '0.43.01',
 +
1552 => '0.43.02',
 +
1553 => '0.43.03',
 +
1555 => '0.43.04',
 +
1556 => '0.43.05',
 +
 +
1596 => '0.44.01',
 +
1597 => '0.44.02',
 +
1600 => '0.44.03',
 +
1603 => '0.44.04',
 +
1604 => '0.44.05',
 +
1611 => '0.44.06',
 +
1612 => '0.44.07',
 +
1613 => '0.44.08',
 +
1614 => '0.44.09',
 +
1620 => '0.44.10',
 +
1623 => '0.44.11',
 +
1625 => '0.44.12',
 +
 +
1710 => '0.47.01',
 +
1711 => '0.47.02',
 +
1712 => '0.47.03',
 +
1715 => '0.47.04',
 +
1716 => '0.47.05',
 +
 +
2078 => '0.50.01',
 +
2079 => '0.50.02',
 +
2080 => '0.50.03', // through 0.50.04
 +
2081 => '0.50.05', // through 0.50.12
 +
2082 => '0.50.13', // through 0.50.15
 +
 +
3013 => '0.51.02', // through 0.51.08
 
);
 
);
  
Line 52: Line 111:
 
while (1)
 
while (1)
 
{
 
{
$len = readLong($file);
+
$len = @readLong($file);
 
if (feof($file))
 
if (feof($file))
 
break;
 
break;
Line 94: Line 153:
 
if (isset($versions[$version]))
 
if (isset($versions[$version]))
 
echo "World is from version $versions[$version]\n";
 
echo "World is from version $versions[$version]\n";
else echo "World is from an unrecognized version!\n";
+
else echo "World is from an unrecognized version '$version'!\n";
 
$comp = readLong($raw);
 
$comp = readLong($raw);
 
if ($comp == 1)
 
if ($comp == 1)
Line 104: Line 163:
 
if ($version >= 1372)
 
if ($version >= 1372)
 
fseek($raw, 0x14, SEEK_CUR);
 
fseek($raw, 0x14, SEEK_CUR);
if ($version >= 1400)
+
if ($version >= 1384)
 
fseek($raw, 0x4, SEEK_CUR);
 
fseek($raw, 0x4, SEEK_CUR);
 
if ($version >= 1441)
 
if ($version >= 1441)
 
fseek($raw, 0x14, SEEK_CUR);
 
fseek($raw, 0x14, SEEK_CUR);
 +
if ($version >= 1484)
 +
fseek($raw, 0xC, SEEK_CUR);
 +
if ($version >= 1485)
 +
fseek($raw, 0x8, SEEK_CUR);
 +
if ($version >= 1493)
 +
fseek($raw, 0x4, SEEK_CUR);
 +
if ($version >= 1571)
 +
fseek($raw, 0x4, SEEK_CUR);
 +
if ($version >= 1662)
 +
fseek($raw, 0x8, SEEK_CUR);
 +
 
if (readByte($raw))
 
if (readByte($raw))
 
{
 
{
Line 118: Line 188:
 
$len = readShort($raw);
 
$len = readShort($raw);
 
$world = fread($raw, $len);
 
$world = fread($raw, $len);
 +
 +
if ($version >= 2072)
 +
{
 +
fseek($raw, 0x8, SEEK_CUR);
 +
fseek($raw, readShort($raw), SEEK_CUR);
 +
fseek($raw, readShort($raw), SEEK_CUR);
 +
fseek($raw, 0x10, SEEK_CUR);
 +
fseek($raw, readShort($raw), SEEK_CUR);
 +
fseek($raw, 0x4, SEEK_CUR);
 +
}
 +
 
echo "Extracting randomly generated raws of $world:\n\n";
 
echo "Extracting randomly generated raws of $world:\n\n";
 
}
 
}
Line 129: Line 210:
 
if (isset($versions[$version]))
 
if (isset($versions[$version]))
 
echo "World is from version $versions[$version]\n";
 
echo "World is from version $versions[$version]\n";
else echo "World is from an unrecognized version!\n";
+
else echo "World is from an unrecognized version '$version'!\n";
 
$comp = readLong($raw);
 
$comp = readLong($raw);
 
if ($comp == 1)
 
if ($comp == 1)
Line 139: Line 220:
 
if ($version >= 1372)
 
if ($version >= 1372)
 
fseek($raw, 0x14, SEEK_CUR);
 
fseek($raw, 0x14, SEEK_CUR);
if ($version >= 1400)
+
if ($version >= 1384)
 
fseek($raw, 0x4, SEEK_CUR);
 
fseek($raw, 0x4, SEEK_CUR);
if ($version >= 1441) // GUESS
+
if ($version >= 1441)
 
fseek($raw, 0x14, SEEK_CUR);
 
fseek($raw, 0x14, SEEK_CUR);
 +
if ($version >= 1484)
 +
fseek($raw, 0xC, SEEK_CUR);
 +
if ($version >= 1485)
 +
fseek($raw, 0x8, SEEK_CUR);
 +
if ($version >= 1493)
 +
fseek($raw, 0x4, SEEK_CUR);
 +
if ($version >= 1571)
 +
fseek($raw, 0x4, SEEK_CUR);
 +
if ($version >= 1662)
 +
fseek($raw, 0x8, SEEK_CUR);
  
 
$len = readShort($raw);
 
$len = readShort($raw);
Line 149: Line 240:
 
$len = readShort($raw);
 
$len = readShort($raw);
 
$world = fread($raw, $len);
 
$world = fread($raw, $len);
echo "Extracting randomly generated raws of $world:\n\n";
+
$year = readLong($raw);
readLong($raw); // year
 
}
 
 
 
if ($version >= 1441)
 
{
 
$numDivineMats = readLong($raw);
 
  
for ($i = 0; $i < $numDivineMats; $i++)
+
if ($version >= 2072)
 
{
 
{
$data = '';
+
fseek($raw, 0x8, SEEK_CUR);
$file = "divine_$i";
+
fseek($raw, readShort($raw), SEEK_CUR);
$numLines = readLong($raw);
+
fseek($raw, readShort($raw), SEEK_CUR);
for ($j = 0; $j < $numLines; $j++)
+
fseek($raw, 0x10, SEEK_CUR);
{
+
fseek($raw, readShort($raw), SEEK_CUR);
$len = readShort($raw);
+
fseek($raw, 0x4, SEEK_CUR);
$str = fread($raw, $len);
 
$data .= "$str\r\n";
 
if (preg_match('/\[INORGANIC:(.*?)\]/', $str, $x))
 
$file = $x[1];
 
}
 
echo "$file...\n";
 
file_put_contents($file .'.txt', $data);
 
 
}
 
}
 +
 +
echo "Extracting randomly generated raws of $world year $year:\n\n";
 
}
 
}
  
if ($version >= 1372)
+
function extractList ($raw, $type, $tokens)
 
{
 
{
$numMaterials = readLong($raw);
+
$count = readLong($raw);
 +
echo "Extracting $count $type definitions...\n";
  
for ($i = 0; $i < $numMaterials; $i++)
+
for ($i = 0; $i < $count; $i++)
 
{
 
{
 
$data = '';
 
$data = '';
$file = "material_$i";
+
$file = $type.'_'.$i;
 
$numLines = readLong($raw);
 
$numLines = readLong($raw);
 
for ($j = 0; $j < $numLines; $j++)
 
for ($j = 0; $j < $numLines; $j++)
Line 189: Line 270:
 
$str = fread($raw, $len);
 
$str = fread($raw, $len);
 
$data .= "$str\r\n";
 
$data .= "$str\r\n";
if (preg_match('/\[INORGANIC:(.*?)\]/', $str, $x))
+
foreach ($tokens as $token)
$file = $x[1];
+
if (preg_match('/\['.$token.':(.*?)\]/', $str, $x))
 +
$file = $x[1];
 
}
 
}
 
echo "$file...\n";
 
echo "$file...\n";
Line 197: Line 279:
 
}
 
}
  
if ($version >= 1400)
+
if ($version >= 1372)
{
+
extractList($raw, 'material', array('INORGANIC'));
$numItems = readLong($raw);
 
  
for ($i = 0; $i < $numItems; $i++)
+
if ($version >= 1441)
{
+
extractList($raw, 'plant', array('PLANT'));
$data = '';
 
$file = "item_$i";
 
$numLines = readLong($raw);
 
for ($j = 0; $j < $numLines; $j++)
 
{
 
$len = readShort($raw);
 
$str = fread($raw, $len);
 
$data .= "$str\r\n";
 
if (preg_match('/\[ITEM_.*?:(.*?)\]/', $str, $x))
 
$file = $x[1];
 
}
 
echo "$file...\n";
 
file_put_contents($file .'.txt', $data);
 
}
 
}
 
  
$numCreatures = readLong($raw);
+
if ($version >= 1390)
 +
extractList($raw, 'item', array('ITEM_.*?'));
  
for ($i = 0; $i < $numCreatures; $i++)
+
extractList($raw, 'creature', array('CREATURE'));
{
 
$data = '';
 
$file = "creature_$i";
 
$numLines = readLong($raw);
 
for ($j = 0; $j < $numLines; $j++)
 
{
 
$len = readShort($raw);
 
$str = fread($raw, $len);
 
$data .= "$str\r\n";
 
if (preg_match('/\[CREATURE:(.*?)\]/', $str, $x))
 
$file = $x[1];
 
}
 
echo "$file...\n";
 
file_put_contents($file .'.txt', $data);
 
}
 
  
 
if ($version >= 1441)
 
if ($version >= 1441)
{
+
extractList($raw, 'entity', array('ENTITY'));
$numDivineCreatures = readLong($raw);
 
  
for ($i = 0; $i < $numDivineCreatures; $i++)
+
if ($version >= 1484)
{
+
extractList($raw, 'reaction', array('REACTION'));
$data = '';
 
$file = "divine_creature_$i";
 
$numLines = readLong($raw);
 
for ($j = 0; $j < $numLines; $j++)
 
{
 
$len = readShort($raw);
 
$str = fread($raw, $len);
 
$data .= "$str\r\n";
 
if (preg_match('/\[CREATURE:(.*?)\]/', $str, $x))
 
$file = $x[1];
 
}
 
echo "$file...\n";
 
file_put_contents($file .'.txt', $data);
 
}
 
}
 
  
 
if ($version >= 1372)
 
if ($version >= 1372)
{
+
extractList($raw, 'interaction', array('INTERACTION'));
$numInteractions = readLong($raw);
 
  
for ($i = 0; $i < $numInteractions; $i++)
+
if ($version >= 1423)
{
+
extractList($raw, 'language', array('TRANSLATION'));
$data = '';
 
$file = "interaction_$i";
 
$numLines = readLong($raw);
 
for ($j = 0; $j < $numLines; $j++)
 
{
 
$len = readShort($raw);
 
$str = fread($raw, $len);
 
$data .= "$str\r\n";
 
if (preg_match('/\[INTERACTION:(.*?)\]/', $str, $x))
 
$file = $x[1];
 
}
 
echo "$file...\n";
 
file_put_contents($file .'.txt', $data);
 
}
 
}
 
 
 
if ($version >= 1441)
 
{
 
$numDivineLanguages = readLong($raw);
 
 
 
for ($i = 0; $i < $numDivineLanguages; $i++)
 
{
 
$data = '';
 
$file = "divine_language_$i";
 
$numLines = readLong($raw);
 
for ($j = 0; $j < $numLines; $j++)
 
{
 
$len = readShort($raw);
 
$str = fread($raw, $len);
 
$data .= "$str\r\n";
 
if (preg_match('/\[TRANSLATION:(.*?)\]/', $str, $x))
 
$file = $x[1];
 
}
 
echo "$file...\n";
 
file_put_contents($file .'.txt', $data);
 
}
 
}
 
  
 
echo "done!\n";
 
echo "done!\n";
 
?></nowiki>
 
?></nowiki>

Latest revision as of 19:04, 21 March 2025

<?php
// Maps the save-format version number (the first 32-bit value read from
// world.dat / world.sav) to the name of the release that wrote it.
// The table is only consulted to print a friendly release name; the parsing
// code below compares against the raw version numbers directly, so a version
// missing from this table is still processed.
$versions = array(
	// 0.31.x releases
	// NOTE(review): there is no entry for 0.31.07 - confirm whether that is intentional.
	1287 => '0.31.01',
	1288 => '0.31.02',
	1289 => '0.31.03',
	1292 => '0.31.04',
	1295 => '0.31.05',
	1297 => '0.31.06',
	1300 => '0.31.08',
	1304 => '0.31.09',
	1305 => '0.31.10',
	1310 => '0.31.11',
	1311 => '0.31.12',
	1323 => '0.31.13',
	1325 => '0.31.14',
	1326 => '0.31.15',
	1327 => '0.31.16',
	1340 => '0.31.17',
	1341 => '0.31.18',
	1351 => '0.31.19',
	1353 => '0.31.20',
	1354 => '0.31.21',
	1359 => '0.31.22',
	1360 => '0.31.23',
	1361 => '0.31.24',
	1362 => '0.31.25',

	// 0.34.x releases
	1372 => '0.34.01',
	1374 => '0.34.02',
	1376 => '0.34.03',
	1377 => '0.34.04',
	1378 => '0.34.05',
	1382 => '0.34.06',
	1383 => '0.34.07',
	1400 => '0.34.08',
	1402 => '0.34.09',
	1403 => '0.34.10',
	1404 => '0.34.11',

	// 0.40.x releases
	1441 => '0.40.01',
	1442 => '0.40.02',
	1443 => '0.40.03',
	1444 => '0.40.04',
	1445 => '0.40.05',
	1446 => '0.40.06',
	1448 => '0.40.07',
	1449 => '0.40.08',
	1451 => '0.40.09',
	1452 => '0.40.10',
	1456 => '0.40.11',
	1459 => '0.40.12',
	1462 => '0.40.13',
	1469 => '0.40.14',
	1470 => '0.40.15',
	1471 => '0.40.16',
	1472 => '0.40.17',
	1473 => '0.40.18',
	1474 => '0.40.19',
	1477 => '0.40.20',
	1478 => '0.40.21',
	1479 => '0.40.22',
	1480 => '0.40.23',
	1481 => '0.40.24',

	// 0.42.x releases
	1531 => '0.42.01',
	1532 => '0.42.02',
	1533 => '0.42.03',
	1534 => '0.42.04',
	1537 => '0.42.05',
	1542 => '0.42.06',

	// 0.43.x releases
	1551 => '0.43.01',
	1552 => '0.43.02',
	1553 => '0.43.03',
	1555 => '0.43.04',
	1556 => '0.43.05',

	// 0.44.x releases
	1596 => '0.44.01',
	1597 => '0.44.02',
	1600 => '0.44.03',
	1603 => '0.44.04',
	1604 => '0.44.05',
	1611 => '0.44.06',
	1612 => '0.44.07',
	1613 => '0.44.08',
	1614 => '0.44.09',
	1620 => '0.44.10',
	1623 => '0.44.11',
	1625 => '0.44.12',

	// 0.47.x releases
	1710 => '0.47.01',
	1711 => '0.47.02',
	1712 => '0.47.03',
	1715 => '0.47.04',
	1716 => '0.47.05',

	// 0.50.x releases; one save version can cover several releases, in which
	// case only the first release is named and the comment gives the last.
	2078 => '0.50.01',
	2079 => '0.50.02',
	2080 => '0.50.03', // through 0.50.04
	2081 => '0.50.05', // through 0.50.12
	2082 => '0.50.13', // through 0.50.15

	// 0.51.x releases
	3013 => '0.51.02', // through 0.51.08
);

/**
 * Expands a compressed world file into a temporary uncompressed copy.
 *
 * The input stream must be positioned just after its own 8-byte header
 * (version + compression flag). From there it is read as a sequence of
 * blocks, each a 32-bit length followed by that many bytes of zlib data.
 * The output starts with a rewritten header (the given version and a
 * compression flag of 0) followed by the inflated blocks.
 *
 * The script is terminated with a message if a block has an invalid length
 * or cannot be inflated, instead of silently producing a damaged stream.
 *
 * @param int      $version save version to store in the rewritten header
 * @param resource $file    compressed input stream; it is closed before returning
 * @return resource temporary file positioned just past its 8-byte header
 */
function decompress ($version, $file)
{
	$out = tmpfile();
	if ($out === false)
		die("Could not create a temporary file for decompression!");

	// write 'uncompressed' header
	fwrite($out, pack('VV', $version, 0));
	while (1)
	{
		// readLong() yields nothing useful once the input is exhausted; the
		// feof() test right after it is what ends the loop.
		$len = @readLong($file);
		if (feof($file))
			break;

		// A block length below 1 is never valid, and fread() refuses it
		// (ValueError on PHP 8), so report corruption explicitly.
		if ($len < 1)
			die("Compressed data is corrupted (invalid block length)!");

		$block = fread($file, $len);
		$data = gzuncompress($block);
		if ($data === false)
			die("Compressed data is corrupted (block could not be decompressed)!");
		fwrite($out, $data);
	}
	rewind($out);
	// seek past the headers
	fseek($out, 8, SEEK_CUR);
	fclose($file);
	return $out;
}

/**
 * Reads a 32-bit little-endian unsigned integer from a stream.
 *
 * @param resource $file open stream positioned at the value
 * @return int|null the decoded value, or null when fewer than 4 bytes could be read
 */
function readLong ($file)
{
	$x = fread($file, 4);
	// A short read (end of file / truncated data) cannot be unpacked. Return
	// null explicitly rather than indexing into unpack()'s false result,
	// which raises a warning on current PHP versions.
	if ($x === false || strlen($x) < 4)
		return null;
	$pck = unpack('Vdata', $x);
	return $pck['data'];
}
/**
 * Reads a 16-bit little-endian unsigned integer from a stream.
 *
 * @param resource $file open stream positioned at the value
 * @return int|null the decoded value, or null when fewer than 2 bytes could be read
 */
function readShort ($file)
{
	$x = fread($file, 2);
	// A short read (end of file / truncated data) cannot be unpacked. Return
	// null explicitly rather than indexing into unpack()'s false result,
	// which raises a warning on current PHP versions.
	if ($x === false || strlen($x) < 2)
		return null;
	$pck = unpack('vdata', $x);
	return $pck['data'];
}
/**
 * Reads a single unsigned byte from a stream.
 *
 * @param resource $file open stream positioned at the value
 * @return int|null the byte value (0-255), or null when nothing could be read
 */
function readByte ($file)
{
	$x = fread($file, 1);
	// Nothing read (end of file) cannot be unpacked. Return null explicitly
	// rather than indexing into unpack()'s false result, which raises a
	// warning on current PHP versions.
	if ($x === false || strlen($x) < 1)
		return null;
	$pck = unpack('Cdata', $x);
	return $pck['data'];
}

// Optional first command-line argument: the directory that contains the
// world file. Without it, the file is looked up in the current directory.
// DIRECTORY_SEPARATOR keeps the Windows behaviour (backslash) while also
// producing a usable path on other systems.
$dir = '';
if ($argc > 1)
	$dir = $argv[1] . DIRECTORY_SEPARATOR;

// Header growth by save version: once the version reaches the key, that many
// extra bytes have to be skipped. The entries are applied in the order listed.
$headerGrowth = array(
	1372 => 0x14,
	1384 => 0x4,
	1441 => 0x14,
	1484 => 0xC,
	1485 => 0x8,
	1493 => 0x4,
	1571 => 0x4,
	1662 => 0x8,
);

// world.dat is tried first; world.sav is the fallback when it cannot be opened.
$raw = @fopen($dir.'world.dat', 'rb');
$fromSav = !$raw;
if ($fromSav)
{
	$raw = @fopen($dir.'world.sav', 'rb');
	if (!$raw)
		die("Could not open world.dat or world.sav!");
}

// Both files begin with the save version followed by a compression flag.
$version = readLong($raw);
if (!isset($versions[$version]))
	echo "World is from an unrecognized version '$version'!\n";
else
	echo "World is from version $versions[$version]\n";

// Flag 1 means compressed, 0 means plain; any other positive value is rejected.
$comp = readLong($raw);
if ($comp == 1)
	$raw = decompress($version, $raw);
elseif ($comp > 0)
	die($fromSav ? "world.sav file is corrupted!" : "world.dat file is corrupted!");

// Skip the fixed part of the header (its size differs between the two file
// types), then every version-dependent addition that applies.
fseek($raw, $fromSav ? 0x56 : 0x46, SEEK_CUR);
foreach ($headerGrowth as $minVersion => $bytes)
	if ($version >= $minVersion)
		fseek($raw, $bytes, SEEK_CUR);

if ($fromSav)
{
	// world.sav: a length-prefixed string comes first and is read but not
	// used; the world name and the current year follow.
	fread($raw, readShort($raw));

	$world = fread($raw, readShort($raw));
	$year = readLong($raw);
	$banner = "Extracting randomly generated raws of $world year $year:\n\n";
}
else
{
	// world.dat: when the flag byte is set, two length-prefixed strings and
	// 0x30 more bytes precede the rest of the header.
	if (readByte($raw))
	{
		fseek($raw, readShort($raw), SEEK_CUR);
		fseek($raw, readShort($raw), SEEK_CUR);
		fseek($raw, 0x30, SEEK_CUR);
	}
	fseek($raw, 0xF, SEEK_CUR);

	$world = fread($raw, readShort($raw));
	$banner = "Extracting randomly generated raws of $world:\n\n";
}

// Versions from 2072 on carry an extra run of fixed-size fields and
// length-prefixed strings before the raw lists; skip over all of it.
if ($version >= 2072)
{
	fseek($raw, 0x8, SEEK_CUR);
	fseek($raw, readShort($raw), SEEK_CUR);
	fseek($raw, readShort($raw), SEEK_CUR);
	fseek($raw, 0x10, SEEK_CUR);
	fseek($raw, readShort($raw), SEEK_CUR);
	fseek($raw, 0x4, SEEK_CUR);
}

echo $banner;

/**
 * Extracts one list of raw definitions from the stream into text files.
 *
 * Layout read from $raw: a 32-bit entry count, then for every entry a 32-bit
 * line count followed by that many strings, each prefixed with a 16-bit
 * length. The lines of an entry are joined with CRLF and written to
 * "<name>.txt", relative to the current working directory.
 *
 * The name defaults to "<type>_<index>" and is replaced by the captured text
 * of the last line matching "[<token>:<text>]" for any of the given tokens.
 *
 * @param resource $raw    stream positioned at the start of the list
 * @param string   $type   label used in progress output and default file names
 * @param array    $tokens regular-expression fragments (not escaped) naming
 *                         the tokens whose value identifies an entry
 * @return void
 */
function extractList ($raw, $type, $tokens)
{
	$count = readLong($raw);
	echo "Extracting $count $type definitions...\n";

	// The patterns do not depend on the line being read, so build them once.
	$patterns = array();
	foreach ($tokens as $token)
		$patterns[] = '/\['.$token.':(.*?)\]/';

	for ($i = 0; $i < $count; $i++)
	{
		$data = '';
		$file = $type.'_'.$i;
		$numLines = readLong($raw);
		for ($j = 0; $j < $numLines; $j++)
		{
			$len = readShort($raw);
			// fread() does not accept a length of 0 (ValueError on PHP 8,
			// warning + false before that), so an empty line is produced
			// directly instead of being read.
			$str = ($len > 0) ? fread($raw, $len) : '';
			$data .= "$str\r\n";
			foreach ($patterns as $pattern)
				if (preg_match($pattern, $str, $x))
					$file = $x[1];
		}
		// The name comes from the file's contents: neutralise path separators
		// and drive/stream colons so output cannot leave the working directory.
		$file = strtr($file, '/\\:', '___');
		echo "$file...\n";
		file_put_contents($file .'.txt', $data);
	}
}

// The raw lists appear in the file in exactly this order. Each row gives the
// first save version that contains the list (null = always present), the
// label passed to extractList(), and the token pattern that names an entry.
$rawLists = array(
	array(1372, 'material',    'INORGANIC'),
	array(1441, 'plant',       'PLANT'),
	array(1390, 'item',        'ITEM_.*?'),
	array(null, 'creature',    'CREATURE'),
	array(1441, 'entity',      'ENTITY'),
	array(1484, 'reaction',    'REACTION'),
	array(1372, 'interaction', 'INTERACTION'),
	array(1423, 'language',    'TRANSLATION'),
);

foreach ($rawLists as $rawList)
{
	$minVersion = $rawList[0];
	// Lists absent from this save version are not in the stream at all, so
	// they must be skipped without reading anything.
	if ($minVersion !== null && !($version >= $minVersion))
		continue;
	extractList($raw, $rawList[1], array($rawList[2]));
}

echo "done!\n";
?>