2020-02-26 05:43:55 +03:00
/*
 * Copyright (c) 2020, Fei Wu <f.eiwu@yahoo.com>
*
2021-04-22 11:24:48 +03:00
 * SPDX-License-Identifier: BSD-2-Clause
2020-02-26 05:43:55 +03:00
*/
2022-12-04 21:02:33 +03:00
# include <AK/DeprecatedString.h>
2020-05-26 14:52:44 +03:00
# include <AK/LexicalPath.h>
2021-06-11 20:38:56 +03:00
# include <AK/NumberFormat.h>
2020-02-26 05:43:55 +03:00
# include <AK/Vector.h>
# include <LibCore/ArgsParser.h>
# include <LibCore/DateTime.h>
# include <LibCore/DirIterator.h>
2023-02-09 05:02:46 +03:00
# include <LibCore/File.h>
2021-12-18 20:59:15 +03:00
# include <LibCore/System.h>
# include <LibMain/Main.h>
2020-02-26 05:43:55 +03:00
# include <limits.h>
# include <string.h>
struct DuOption {
enum class TimeType {
NotUsed ,
Modification ,
Access ,
Status
} ;
2021-06-11 20:38:56 +03:00
bool human_readable = false ;
2023-01-10 15:08:57 +03:00
bool human_readable_si = false ;
2020-02-26 05:43:55 +03:00
bool all = false ;
bool apparent_size = false ;
2022-07-23 19:25:21 +03:00
i64 threshold = 0 ;
2020-02-26 05:43:55 +03:00
TimeType time_type = TimeType : : NotUsed ;
2022-12-04 21:02:33 +03:00
Vector < DeprecatedString > excluded_patterns ;
2022-07-23 19:25:21 +03:00
u64 block_size = 1024 ;
2022-07-23 11:37:29 +03:00
size_t max_depth = SIZE_MAX ;
2020-02-26 05:43:55 +03:00
} ;
2022-12-04 21:02:33 +03:00
// Fills `files` and `du_option` from the command line arguments.
static ErrorOr<void> parse_args(Main::Arguments arguments, Vector<DeprecatedString>& files, DuOption& du_option);
// Returns the size accumulated for `path` and prints a line for it unless it is filtered out.
static ErrorOr<u64> print_space_usage(DeprecatedString const& path, DuOption const& du_option, size_t current_depth, bool inside_dir = false);
2020-02-26 05:43:55 +03:00
2021-12-18 20:59:15 +03:00
// Program entry point: parses the command line, then reports usage for every requested path in order.
// A failure from either step is propagated to the caller through TRY.
ErrorOr<int> serenity_main(Main::Arguments arguments)
{
    DuOption options;
    Vector<DeprecatedString> paths;
    TRY(parse_args(arguments, paths, options));

    for (auto const& path : paths) {
        // Each command line argument starts at depth 0; the returned total is not needed here
        // because the callee prints its own report lines.
        TRY(print_space_usage(path, options, 0));
    }

    return 0;
}
2022-12-04 21:02:33 +03:00
// Parses the command line into `files` (the paths to measure) and `du_option` (reporting settings).
//
// - `--summarize` is implemented by forcing `max_depth` to 0.
// - `--exclude` contributes a single pattern; `--exclude-from` contributes one pattern per line of the named file.
// - If no path is given on the command line, "." is used.
//
// Returns an error when the exclude-from file cannot be opened or read, or when the block size is zero.
ErrorOr<void> parse_args(Main::Arguments arguments, Vector<DeprecatedString>& files, DuOption& du_option)
{
    bool summarize = false;
    StringView pattern;
    StringView exclude_from;
    Vector<StringView> files_to_process;

    // --time takes a keyword and maps it onto DuOption::TimeType; unknown keywords are rejected
    // by returning false from the callback.
    Core::ArgsParser::Option time_option {
        Core::ArgsParser::OptionArgumentMode::Required,
        "Show time of type time-type of any file in the directory, or any of its subdirectories. "
        "Available choices: mtime, modification, ctime, status, use, atime, access",
        "time",
        0,
        "time-type",
        [&du_option](auto const* option_ptr) {
            StringView option { option_ptr, strlen(option_ptr) };
            if (option == "mtime"sv || option == "modification"sv)
                du_option.time_type = DuOption::TimeType::Modification;
            else if (option == "ctime"sv || option == "status"sv || option == "use"sv)
                du_option.time_type = DuOption::TimeType::Status;
            else if (option == "atime"sv || option == "access"sv)
                du_option.time_type = DuOption::TimeType::Access;
            else
                return false;
            return true;
        }
    };

    // -k is an argument-less shorthand that resets the block size to 1024.
    Core::ArgsParser::Option block_size_1k_option {
        Core::ArgsParser::OptionArgumentMode::None,
        "Equivalent to `--block-size 1024`",
        nullptr,
        'k',
        nullptr,
        [&du_option](auto const*) {
            du_option.block_size = 1024;
            return true;
        }
    };

    Core::ArgsParser args_parser;
    args_parser.set_general_help("Display actual or apparent disk usage of files or directories.");
    args_parser.add_option(du_option.all, "Write counts for all files, not just directories", "all", 'a');
    args_parser.add_option(du_option.apparent_size, "Print apparent sizes, rather than disk usage", "apparent-size", 0);
    args_parser.add_option(du_option.human_readable, "Print human-readable sizes", "human-readable", 'h');
    args_parser.add_option(du_option.human_readable_si, "Print human-readable sizes in SI units", "si", 0);
    args_parser.add_option(du_option.max_depth, "Print the total for a directory or file only if it is N or fewer levels below the command line argument", "max-depth", 'd', "N");
    args_parser.add_option(summarize, "Display only a total for each argument", "summarize", 's');
    args_parser.add_option(du_option.threshold, "Exclude entries smaller than size if positive, or entries greater than size if negative", "threshold", 't', "size");
    args_parser.add_option(move(time_option));
    args_parser.add_option(pattern, "Exclude files that match pattern", "exclude", 0, "pattern");
    args_parser.add_option(exclude_from, "Exclude files that match any pattern in file", "exclude-from", 'X', "file");
    args_parser.add_option(du_option.block_size, "Outputs file sizes as the required blocks with the given size (defaults to 1024)", "block-size", 'B', "size");
    args_parser.add_option(move(block_size_1k_option));
    args_parser.add_positional_argument(files_to_process, "File to process", "file", Core::ArgsParser::Required::No);
    args_parser.parse(arguments);

    // The block size is later used as a divisor when printing sizes, so a value of zero
    // has to be rejected here instead of dividing by zero during the report.
    if (du_option.block_size == 0)
        return Error::from_string_literal("Block size must be greater than zero");

    if (summarize)
        du_option.max_depth = 0;

    if (!pattern.is_empty())
        du_option.excluded_patterns.append(pattern);

    if (!exclude_from.is_empty()) {
        auto file = TRY(Core::File::open(exclude_from, Core::File::OpenMode::Read));
        auto const buff = TRY(file->read_until_eof());
        if (!buff.is_empty()) {
            // One pattern per line of the file.
            DeprecatedString patterns = DeprecatedString::copy(buff, Chomp);
            du_option.excluded_patterns.extend(patterns.split('\n'));
        }
    }

    for (auto const& file : files_to_process) {
        files.append(file);
    }

    // With no explicit path, measure the current directory.
    if (files.is_empty()) {
        files.append(".");
    }

    return {};
}
2022-12-04 21:02:33 +03:00
// Measures `path` and, unless it is filtered out, prints one report line for it.
//
// Directories are walked recursively and their children's sizes are added to the directory's own size.
//
// Parameters:
//   path          - entry to measure; inspected with lstat.
//   du_option     - reporting settings (see DuOption).
//   current_depth - number of levels below the command line argument; 0 for the argument itself.
//   inside_dir    - true when this call was made while iterating a directory.
//
// Returns the size accumulated for `path`, or 0 if its basename matches an excluded pattern.
// Entries that are too deep, outside the threshold, or plain files inside a directory (without `all`)
// still return their size; they are only left out of the printed report.
//
// Fails if lstat fails, if a directory cannot be iterated, or if any recursive call fails.
ErrorOr<u64> print_space_usage(DeprecatedString const& path, DuOption const& du_option, size_t current_depth, bool inside_dir)
{
    struct stat path_stat = TRY(Core::System::lstat(path));

    // Excluded entries contribute nothing. This has to happen before descending: otherwise an
    // excluded directory would still be traversed and its children would still be reported.
    auto const basename = LexicalPath::basename(path);
    for (auto const& pattern : du_option.excluded_patterns) {
        if (basename.matches(pattern, CaseSensitivity::CaseSensitive))
            return { 0 };
    }

    u64 size = 0;
    bool const is_directory = S_ISDIR(path_stat.st_mode);
    if (is_directory) {
        auto di = Core::DirIterator(path, Core::DirIterator::SkipParentAndBaseDir);
        if (di.has_error()) {
            // Diagnostics go to the error stream so they do not mix with the report on stdout.
            warnln("du: cannot read directory '{}': {}", path, di.error_string());
            return Error::from_string_literal("An error occurred. See previous error.");
        }

        while (di.has_next()) {
            auto const child_path = di.next_full_path();
            size += TRY(print_space_usage(child_path, du_option, current_depth + 1, true));
        }
    }

    if (!du_option.apparent_size) {
        // st_blocks is multiplied by a fixed 512-byte unit, independent of the output block size.
        constexpr auto block_size = 512;
        size += path_stat.st_blocks * block_size;
    } else {
        size += path_stat.st_size;
    }

    bool is_beyond_depth = current_depth > du_option.max_depth;
    bool is_inner_file = inside_dir && !is_directory;

    bool is_outside_threshold = false;
    if (du_option.threshold > 0) {
        is_outside_threshold = size < static_cast<u64>(du_option.threshold);
    } else if (du_option.threshold < 0) {
        // Take the magnitude in unsigned arithmetic; negating the most negative i64 as a signed
        // value would overflow.
        u64 const magnitude = static_cast<u64>(0) - static_cast<u64>(du_option.threshold);
        is_outside_threshold = size > magnitude;
    }

    // All of these still count towards the full size, they are just not reported on individually.
    if (is_beyond_depth || (is_inner_file && !du_option.all) || is_outside_threshold)
        return size;

    if (du_option.human_readable) {
        out("{}", human_readable_size(size));
    } else if (du_option.human_readable_si) {
        out("{}", human_readable_size(size, AK::HumanReadableBasedOn::Base10));
    } else {
        out("{}", ceil_div(size, du_option.block_size));
    }

    if (du_option.time_type == DuOption::TimeType::NotUsed) {
        outln("\t{}", path);
    } else {
        // Modification time is the default; the other two kinds override it.
        auto time = path_stat.st_mtime;
        switch (du_option.time_type) {
        case DuOption::TimeType::Access:
            time = path_stat.st_atime;
            break;
        case DuOption::TimeType::Status:
            time = path_stat.st_ctime;
            break;
        default:
            break;
        }

        auto const formatted_time = Core::DateTime::from_timestamp(time).to_deprecated_string();
        outln("\t{}\t{}", formatted_time, path);
    }

    return { size };
}