2025-02-21 11:31:04 +01:00
|
|
|
/* Lziprecover - Data recovery tool for the lzip format
|
2025-02-21 11:32:21 +01:00
|
|
|
Copyright (C) 2009-2023 Antonio Diaz Diaz.
|
2025-02-21 10:12:48 +01:00
|
|
|
|
2025-02-21 11:31:04 +01:00
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
the Free Software Foundation, either version 2 of the License, or
|
|
|
|
(at your option) any later version.
|
2025-02-21 10:12:48 +01:00
|
|
|
|
2025-02-21 11:31:04 +01:00
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
2025-02-21 10:12:48 +01:00
|
|
|
|
2025-02-21 11:31:04 +01:00
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2025-02-21 10:12:48 +01:00
|
|
|
*/
|
|
|
|
|
|
|
|
#define _FILE_OFFSET_BITS 64
|
|
|
|
|
|
|
|
#include <algorithm>
|
|
|
|
#include <cerrno>
|
|
|
|
#include <cstdio>
|
|
|
|
#include <cstdlib>
|
|
|
|
#include <cstring>
|
|
|
|
#include <string>
|
|
|
|
#include <vector>
|
|
|
|
#include <stdint.h>
|
|
|
|
#include <unistd.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
|
|
|
|
#include "lzip.h"
|
|
|
|
#include "decoder.h"
|
2025-02-21 11:29:36 +01:00
|
|
|
#include "lzip_index.h"
|
2025-02-21 10:12:48 +01:00
|
|
|
|
|
|
|
|
|
|
|
namespace {
|
|
|
|
|
2025-02-21 11:31:04 +01:00
|
|
|
bool decompress_member( const int infd, const Pretty_print & pp,
|
|
|
|
const unsigned long long mpos,
|
|
|
|
const unsigned long long outskip,
|
|
|
|
const unsigned long long outend )
|
2025-02-21 10:12:48 +01:00
|
|
|
{
|
2025-02-21 11:26:24 +01:00
|
|
|
Range_decoder rdec( infd );
|
2025-02-21 11:29:36 +01:00
|
|
|
Lzip_header header;
|
|
|
|
rdec.read_data( header.data, Lzip_header::size );
|
2025-02-21 11:26:24 +01:00
|
|
|
if( rdec.finished() ) // End Of File
|
2025-02-21 11:31:04 +01:00
|
|
|
{ pp( "File ends unexpectedly at member header." ); return false; }
|
2025-02-21 11:32:21 +01:00
|
|
|
if( !header.check_magic() ) { pp( bad_magic_msg ); return false; }
|
|
|
|
if( !header.check_version() )
|
2025-02-21 11:31:04 +01:00
|
|
|
{ pp( bad_version( header.version() ) ); return false; }
|
2025-02-21 11:26:24 +01:00
|
|
|
const unsigned dictionary_size = header.dictionary_size();
|
2025-02-21 11:31:04 +01:00
|
|
|
if( !isvalid_ds( dictionary_size ) ) { pp( bad_dict_msg ); return false; }
|
2025-02-21 11:26:24 +01:00
|
|
|
|
2025-02-21 11:28:50 +01:00
|
|
|
if( verbosity >= 2 ) pp();
|
2025-02-21 11:26:24 +01:00
|
|
|
|
|
|
|
LZ_decoder decoder( rdec, dictionary_size, outfd, outskip, outend );
|
|
|
|
const int result = decoder.decode_member( pp );
|
|
|
|
if( result != 0 )
|
|
|
|
{
|
2025-02-21 11:28:50 +01:00
|
|
|
if( verbosity >= 0 && result <= 2 )
|
2025-02-21 10:12:48 +01:00
|
|
|
{
|
2025-02-21 11:26:24 +01:00
|
|
|
pp();
|
|
|
|
std::fprintf( stderr, "%s at pos %llu\n", ( result == 2 ) ?
|
|
|
|
"File ends unexpectedly" : "Decoder error",
|
|
|
|
mpos + rdec.member_position() );
|
2025-02-21 10:12:48 +01:00
|
|
|
}
|
2025-02-21 11:31:04 +01:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
if( decoder.data_position() < outend - outskip )
|
|
|
|
{
|
|
|
|
if( verbosity >= 0 )
|
|
|
|
{ pp(); std::fprintf( stderr,
|
|
|
|
"%sMember at pos %llu contains only %llu bytes of %llu requested.\n",
|
|
|
|
( verbosity >= 2 ) ? "\n" : "", mpos,
|
|
|
|
decoder.data_position() - outskip, outend - outskip ); }
|
|
|
|
return false;
|
2025-02-21 10:12:48 +01:00
|
|
|
}
|
2025-02-21 11:28:50 +01:00
|
|
|
if( verbosity >= 2 ) std::fputs( "done\n", stderr );
|
2025-02-21 11:31:04 +01:00
|
|
|
return true;
|
2025-02-21 10:12:48 +01:00
|
|
|
}
|
|
|
|
|
2025-02-21 11:31:04 +01:00
|
|
|
} // end namespace
|
|
|
|
|
2025-02-21 10:12:48 +01:00
|
|
|
|
2025-02-21 11:23:37 +01:00
|
|
|
/* Format 'num' as text followed by a space and a multiplier prefix.
   'num' is divided by successive powers of 1000 (SI prefixes "k".."Y") or
   1024 (binary prefixes "Ki".."Yi"). Scaling stops as soon as the next
   step would leave a remainder while the current quotient is still
   <= 'limit'. If the final division is exact the quotient is printed as
   an integer, else as a floating point value with two decimals.
   A nonzero 'set_prefix' selects the prefix family for this call and all
   later ones: positive for SI, negative for binary. The initial family
   is SI.
   The result points into one of 8 static buffers used in rotation, so it
   is overwritten after 8 further calls. The function keeps static state
   without any locking. */
const char * format_num( unsigned long long num,
                         unsigned long long limit,
                         const int set_prefix )
  {
  enum { n_prefixes = 8, n_slots = 8, slot_size = 32 };
  const char * const binary_names[n_prefixes] =
    { "Ki", "Mi", "Gi", "Ti", "Pi", "Ei", "Zi", "Yi" };
  const char * const decimal_names[n_prefixes] =
    { "k", "M", "G", "T", "P", "E", "Z", "Y" };
  static char slots[n_slots][slot_size];	// ring of result buffers
  static int next_slot = 0;
  static bool use_si = true;			// persists across calls

  if( set_prefix > 0 ) use_si = true;
  else if( set_prefix < 0 ) use_si = false;

  const unsigned factor = use_si ? 1000 : 1024;
  const char * const * const names = use_si ? decimal_names : binary_names;

  // take the next buffer of the ring
  char * const out = slots[next_slot];
  next_slot = ( next_slot + 1 ) % n_slots;

  unsigned long long den = 1;
  const char * suffix = "";
  int i = 0;
  while( i < n_prefixes && num / den >= factor )
    {
    const unsigned long long next_den = den * factor;
    if( next_den <= den ) break;		// multiplication wrapped around
    // keep the smaller unit if scaling further would lose exactness
    if( num / den <= limit && num % next_den != 0 ) break;
    den = next_den;
    suffix = names[i];
    ++i;
    }

  if( num % den != 0 )
    snprintf( out, slot_size, "%3.2f %s",
              static_cast< double >( num ) / den, suffix );
  else
    snprintf( out, slot_size, "%llu %s", num / den, suffix );
  return out;
  }
|
|
|
|
|
|
|
|
|
2025-02-21 11:32:21 +01:00
|
|
|
bool safe_seek( const int fd, const long long pos,
|
|
|
|
const char * const filename )
|
2025-02-21 11:16:43 +01:00
|
|
|
{
|
|
|
|
if( lseek( fd, pos, SEEK_SET ) == pos ) return true;
|
2025-02-21 11:32:21 +01:00
|
|
|
show_file_error( filename, "Seek error", errno );
|
|
|
|
return false;
|
2025-02-21 11:16:43 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2025-02-21 10:12:48 +01:00
|
|
|
int range_decompress( const std::string & input_filename,
|
2025-02-21 11:26:24 +01:00
|
|
|
const std::string & default_output_filename,
|
2025-02-21 11:32:21 +01:00
|
|
|
const Cl_options & cl_opts, Block range,
|
|
|
|
const bool force, const bool to_stdout )
|
2025-02-21 10:12:48 +01:00
|
|
|
{
|
2025-02-21 11:32:21 +01:00
|
|
|
const char * const filename = input_filename.c_str();
|
2025-02-21 10:12:48 +01:00
|
|
|
struct stat in_stats;
|
2025-02-21 11:32:21 +01:00
|
|
|
const int infd = open_instream( filename, &in_stats, false, true );
|
2025-02-21 10:12:48 +01:00
|
|
|
if( infd < 0 ) return 1;
|
2025-02-21 11:11:34 +01:00
|
|
|
|
2025-02-21 11:32:21 +01:00
|
|
|
const Lzip_index lzip_index( infd, cl_opts, cl_opts.ignore_errors,
|
|
|
|
cl_opts.ignore_errors );
|
2025-02-21 11:29:36 +01:00
|
|
|
if( lzip_index.retval() != 0 )
|
2025-02-21 11:32:21 +01:00
|
|
|
{ show_file_error( filename, lzip_index.error().c_str() );
|
2025-02-21 11:29:36 +01:00
|
|
|
return lzip_index.retval(); }
|
2025-02-21 10:12:48 +01:00
|
|
|
|
2025-02-21 11:31:04 +01:00
|
|
|
const long long udata_size = lzip_index.udata_size();
|
|
|
|
if( range.end() > udata_size )
|
|
|
|
range.size( std::max( 0LL, udata_size - range.pos() ) );
|
2025-02-21 11:29:36 +01:00
|
|
|
if( range.size() <= 0 )
|
2025-02-21 11:32:21 +01:00
|
|
|
{ if( udata_size > 0 ) show_file_error( filename, "Nothing to do." );
|
2025-02-21 11:31:04 +01:00
|
|
|
return 0; }
|
2025-02-21 10:12:48 +01:00
|
|
|
|
2025-02-21 11:31:04 +01:00
|
|
|
if( to_stdout || default_output_filename.empty() ) outfd = STDOUT_FILENO;
|
2025-02-21 10:12:48 +01:00
|
|
|
else
|
2025-02-21 11:26:24 +01:00
|
|
|
{
|
|
|
|
output_filename = default_output_filename;
|
2025-02-21 11:29:36 +01:00
|
|
|
set_signal_handler();
|
2025-02-21 11:31:04 +01:00
|
|
|
if( !open_outstream( force, true, false, false ) ) return 1;
|
2025-02-21 11:26:24 +01:00
|
|
|
}
|
2025-02-21 11:16:43 +01:00
|
|
|
|
2025-02-21 11:29:36 +01:00
|
|
|
if( verbosity >= 1 )
|
2025-02-21 11:31:04 +01:00
|
|
|
std::fprintf( stderr, "Decompressing range %sB to %sB (%sB of %sBytes)\n",
|
2025-02-21 11:29:36 +01:00
|
|
|
format_num( range.pos() ),
|
|
|
|
format_num( range.pos() + range.size() ),
|
2025-02-21 11:31:04 +01:00
|
|
|
format_num( range.size() ), format_num( udata_size ) );
|
2025-02-21 11:29:36 +01:00
|
|
|
|
|
|
|
Pretty_print pp( input_filename );
|
2025-02-21 11:31:04 +01:00
|
|
|
bool error = false;
|
2025-02-21 11:29:36 +01:00
|
|
|
for( long i = 0; i < lzip_index.members(); ++i )
|
2025-02-21 10:12:48 +01:00
|
|
|
{
|
2025-02-21 11:29:36 +01:00
|
|
|
const Block & db = lzip_index.dblock( i );
|
2025-02-21 10:12:48 +01:00
|
|
|
if( range.overlaps( db ) )
|
|
|
|
{
|
2025-02-21 11:29:36 +01:00
|
|
|
if( verbosity >= 3 && lzip_index.members() > 1 )
|
2025-02-21 11:20:27 +01:00
|
|
|
std::fprintf( stderr, "Decompressing member %3ld\n", i + 1 );
|
2025-02-21 10:12:48 +01:00
|
|
|
const long long outskip = std::max( 0LL, range.pos() - db.pos() );
|
2025-02-21 11:13:34 +01:00
|
|
|
const long long outend = std::min( db.size(), range.end() - db.pos() );
|
2025-02-21 11:29:36 +01:00
|
|
|
const long long mpos = lzip_index.mblock( i ).pos();
|
2025-02-21 11:32:21 +01:00
|
|
|
if( !safe_seek( infd, mpos, filename ) ) cleanup_and_fail( 1 );
|
2025-02-21 11:31:04 +01:00
|
|
|
if( !decompress_member( infd, pp, mpos, outskip, outend ) )
|
2025-02-21 11:32:21 +01:00
|
|
|
{ if( cl_opts.ignore_errors ) error = true; else cleanup_and_fail( 2 ); }
|
2025-02-21 10:12:48 +01:00
|
|
|
pp.reset();
|
|
|
|
}
|
|
|
|
}
|
2025-02-21 11:32:21 +01:00
|
|
|
if( close( infd ) != 0 )
|
|
|
|
{ show_file_error( filename, "Error closing input file", errno );
|
|
|
|
cleanup_and_fail( 1 ); }
|
2025-02-21 11:31:04 +01:00
|
|
|
if( close_outstream( &in_stats ) != 0 ) cleanup_and_fail( 1 );
|
|
|
|
if( verbosity >= 2 && !error )
|
2025-02-21 11:25:43 +01:00
|
|
|
std::fputs( "Byte range decompressed successfully.\n", stderr );
|
2025-02-21 11:31:04 +01:00
|
|
|
return 0; // either no error or ignored
|
2025-02-21 10:12:48 +01:00
|
|
|
}
|