2020-02-05 15:36:59 -07:00
# include "Console.h"
# include "PluginManager.h"
# include "MemAccess.h"
# include "DataDefs.h"
# include "DataIdentity.h"
2020-02-14 18:47:26 -07:00
# include "LuaTools.h"
# include "LuaWrapper.h"
2020-02-05 15:36:59 -07:00
2020-02-29 14:08:39 -07:00
# include "df/large_integer.h"
2020-02-05 19:29:16 -07:00
# if defined(WIN32) && defined(DFHACK64)
# define _WIN32_WINNT 0x0501
# define WINVER 0x0501
# define WIN32_LEAN_AND_MEAN
2020-02-05 20:47:25 -07:00
# include <windows.h>
2020-02-05 19:29:16 -07:00
# endif
2020-02-15 11:54:04 -07:00
# include <deque>
2020-02-29 13:18:27 -07:00
# include <inttypes.h>
2020-02-05 15:36:59 -07:00
# include <set>
# include <typeinfo>
using namespace DFHack ;
DFHACK_PLUGIN ( " check-structures-sanity " ) ;
static command_result command ( color_ostream & , std : : vector < std : : string > & ) ;
# ifdef WIN32
# define UNEXPECTED __debugbreak()
# else
# define UNEXPECTED __asm__ volatile ("int $0x03")
# endif
2020-03-02 20:33:04 -07:00
# define MIN_SIZE_FOR_SUGGEST 64
static std : : map < size_t , std : : vector < std : : string > > known_types_by_size ;
static void build_size_table ( ) ;
2020-02-14 18:47:26 -07:00
DFhackCExport command_result plugin_init ( color_ostream & , std : : vector < PluginCommand > & commands )
2020-02-05 15:36:59 -07:00
{
commands . push_back ( PluginCommand (
" check-structures-sanity " ,
" performs a sanity check on df-structures " ,
command ,
false ,
2020-03-01 11:15:26 -07:00
" check-structures-sanity [-enums] [-sizes] [-lowmem] [-maxerrors n] [-failfast] [starting_point] \n "
2020-02-14 18:47:26 -07:00
" \n "
2020-02-15 11:54:04 -07:00
" -enums: report unexpected or unnamed enum or bitfield values. \n "
" -sizes: report struct and class sizes that don't match structures. (requires sizecheck) \n "
2020-03-01 11:15:26 -07:00
" -lowmem: use depth-first search instead of breadth-first search. uses less memory but processes fields in a less intuitive order. \n "
" -maxerrors n: set the maximum number of errors before bailing out. \n "
" -failfast: crash if any error is encountered. useful only for debugging. \n "
2020-02-15 11:54:04 -07:00
" starting_point: a lua expression or a word like 'screen', 'item', or 'building'. (defaults to df.global) \n "
2020-02-14 18:47:26 -07:00
" \n "
2020-02-15 11:54:04 -07:00
" by default, check-structures-sanity reports invalid pointers, vectors, strings, and vtables. "
2020-02-05 15:36:59 -07:00
) ) ;
2020-03-02 20:33:04 -07:00
known_types_by_size . clear ( ) ;
build_size_table ( ) ;
2020-02-05 15:36:59 -07:00
return CR_OK ;
}
2020-03-02 20:33:04 -07:00
static void build_size_table ( )
{
for ( auto & ident : compound_identity : : getTopScope ( ) )
{
if ( ident - > byte_size ( ) > = MIN_SIZE_FOR_SUGGEST )
{
known_types_by_size [ ident - > byte_size ( ) ] . push_back ( ident - > getFullName ( ) ) ;
}
}
}
2020-03-06 18:28:14 -07:00
static bool is_df_linked_list ( type_identity * type )
{
if ( type - > type ( ) ! = IDTYPE_STRUCT )
return false ;
auto struct_type = static_cast < struct_identity * > ( type ) ;
auto fields = struct_type - > getFields ( ) ;
if ( fields [ 0 ] . mode ! = struct_field_info : : POINTER )
return false ;
if ( strcmp ( fields [ 0 ] . name , " item " ) )
return false ;
if ( fields [ 1 ] . mode ! = struct_field_info : : POINTER )
return false ;
if ( fields [ 1 ] . type ! = type )
return false ;
if ( strcmp ( fields [ 1 ] . name , " prev " ) )
return false ;
if ( fields [ 2 ] . mode ! = struct_field_info : : POINTER )
return false ;
if ( fields [ 2 ] . type ! = type )
return false ;
if ( strcmp ( fields [ 2 ] . name , " next " ) )
return false ;
return fields [ 3 ] . mode = = struct_field_info : : END ;
}
2020-02-29 13:18:27 -07:00
static const char * const * get_enum_item_key ( enum_identity * identity , int64_t value )
{
size_t index ;
if ( auto cplx = identity - > getComplex ( ) )
{
auto it = cplx - > value_index_map . find ( value ) ;
if ( it = = cplx - > value_index_map . cend ( ) )
{
return nullptr ;
}
index = it - > second ;
}
else
{
if ( value < identity - > getFirstItem ( ) | | value > identity - > getLastItem ( ) )
{
return nullptr ;
}
index = value - identity - > getFirstItem ( ) ;
}
return & identity - > getKeys ( ) [ index ] ;
}
2020-02-09 13:16:19 -07:00
struct ToCheck
{
std : : vector < std : : string > path ;
void * ptr ;
type_identity * identity ;
std : : unique_ptr < type_identity > temp_identity ;
ToCheck ( )
{
}
ToCheck ( const ToCheck & parent , size_t idx , void * ptr , type_identity * identity ) :
ToCheck ( parent , stl_sprintf ( " [%zu] " , idx ) , ptr , identity )
{
}
ToCheck ( const ToCheck & parent , const std : : string & name , void * ptr , type_identity * identity ) :
path ( parent . path . cbegin ( ) , parent . path . cend ( ) ) ,
ptr ( ptr ) ,
identity ( identity )
{
path . push_back ( name ) ;
}
} ;
2020-02-05 15:36:59 -07:00
class Checker
{
color_ostream & out ;
std : : vector < t_memrange > mapped ;
std : : set < void * > seen_addr ;
2020-02-09 13:16:19 -07:00
public :
2020-02-15 11:54:04 -07:00
std : : deque < ToCheck > queue ;
size_t num_checked ;
2020-02-14 18:47:26 -07:00
bool enums ;
bool sizes ;
2020-02-15 11:54:04 -07:00
bool lowmem ;
2020-03-01 11:15:26 -07:00
bool failfast ;
size_t maxerrors ;
2020-02-09 13:16:19 -07:00
private :
2020-02-05 15:36:59 -07:00
bool ok ;
2020-02-22 14:34:48 -07:00
# ifndef WIN32
// this function doesn't make sense on windows, where std::string is not pointer-sized.
const std : : string * check_possible_stl_string_pointer ( const void * const * ) ;
# endif
2020-02-09 13:16:19 -07:00
bool check_access ( const ToCheck & , void * , type_identity * ) ;
bool check_access ( const ToCheck & , void * , type_identity * , size_t ) ;
2020-03-02 14:34:29 -07:00
const char * check_vtable ( const ToCheck & , void * , type_identity * ) ;
2020-02-09 13:16:19 -07:00
void queue_field ( ToCheck & & , const struct_field_info * ) ;
2020-02-09 14:12:25 -07:00
void queue_static_array ( const ToCheck & , void * , type_identity * , size_t , bool = false , enum_identity * = nullptr ) ;
2020-02-29 17:28:14 -07:00
bool maybe_queue_union ( const ToCheck & , const struct_field_info * , const struct_field_info * ) ;
void queue_union ( const ToCheck & , const ToCheck & ) ;
void queue_union_vector ( const ToCheck & , const ToCheck & ) ;
2020-03-06 15:48:33 -07:00
void queue_union_bitvector ( const ToCheck & , const ToCheck & ) ;
2020-03-06 16:53:05 -07:00
void queue_df_linked_list ( const ToCheck & ) ;
2020-02-29 13:18:27 -07:00
void check_dispatch ( ToCheck & ) ;
2020-02-09 13:16:19 -07:00
void check_global ( const ToCheck & ) ;
void check_primitive ( const ToCheck & ) ;
void check_stl_string ( const ToCheck & ) ;
void check_pointer ( const ToCheck & ) ;
void check_bitfield ( const ToCheck & ) ;
2020-02-20 21:17:25 -07:00
int64_t check_enum ( const ToCheck & ) ;
2020-02-09 13:16:19 -07:00
void check_container ( const ToCheck & ) ;
2020-02-29 17:28:14 -07:00
size_t check_vector_size ( const ToCheck & , size_t ) ;
2020-02-09 13:16:19 -07:00
void check_vector ( const ToCheck & , type_identity * , bool ) ;
void check_deque ( const ToCheck & , type_identity * ) ;
void check_dfarray ( const ToCheck & , type_identity * ) ;
void check_bitarray ( const ToCheck & ) ;
2020-03-06 15:48:33 -07:00
bool check_bitvector ( const ToCheck & ) ;
2020-02-09 13:16:19 -07:00
void check_struct ( const ToCheck & ) ;
void check_virtual ( const ToCheck & ) ;
2020-02-05 15:36:59 -07:00
public :
Checker ( color_ostream & ) ;
bool check ( ) ;
} ;
static command_result command ( color_ostream & out , std : : vector < std : : string > & parameters )
{
2020-02-14 18:47:26 -07:00
CoreSuspender suspend ;
Checker checker ( out ) ;
2020-03-01 11:15:26 -07:00
// check parameters with values first
# define VAL_PARAM(name, expr_using_value) \
auto name # # _idx = std : : find ( parameters . begin ( ) , parameters . end ( ) , " - " # name ) ; \
if ( name # # _idx ! = parameters . end ( ) ) \
{ \
if ( name # # _idx + 1 = = parameters . end ( ) ) \
{ \
return CR_WRONG_USAGE ; \
} \
try \
{ \
auto value = std : : move ( * ( name # # _idx + 1 ) ) ; \
parameters . erase ( ( name # # _idx + 1 ) ) ; \
parameters . erase ( name # # _idx ) ; \
checker . name = ( expr_using_value ) ; \
} \
catch ( std : : exception & ex ) \
{ \
out . printerr ( " check-structures-sanity: argument to -%s: %s \n " , # name , ex . what ( ) ) ; \
return CR_WRONG_USAGE ; \
} \
}
VAL_PARAM ( maxerrors , std : : stoul ( value ) ) ;
# undef VAL_PARAM
2020-02-14 18:47:26 -07:00
# define BOOL_PARAM(name) \
2020-02-15 17:17:30 -07:00
auto name # # _idx = std : : find ( parameters . begin ( ) , parameters . end ( ) , " - " # name ) ; \
2020-03-01 11:15:26 -07:00
if ( name # # _idx ! = parameters . end ( ) ) \
2020-02-14 18:47:26 -07:00
{ \
checker . name = true ; \
parameters . erase ( name # # _idx ) ; \
}
BOOL_PARAM ( enums ) ;
BOOL_PARAM ( sizes ) ;
2020-02-15 11:54:04 -07:00
BOOL_PARAM ( lowmem ) ;
2020-03-01 11:15:26 -07:00
BOOL_PARAM ( failfast ) ;
2020-02-14 18:47:26 -07:00
# undef BOOL_PARAM
if ( parameters . size ( ) > 1 )
2020-02-05 15:36:59 -07:00
{
return CR_WRONG_USAGE ;
}
2020-02-14 18:47:26 -07:00
if ( parameters . empty ( ) )
{
ToCheck global ;
2020-02-21 16:31:22 -07:00
global . path . push_back ( " df.global. " ) ;
2020-02-14 18:47:26 -07:00
global . ptr = nullptr ;
global . identity = & df : : global : : _identity ;
2020-02-05 15:36:59 -07:00
2020-02-15 11:54:04 -07:00
checker . queue . push_back ( std : : move ( global ) ) ;
2020-02-14 18:47:26 -07:00
}
else
{
using namespace DFHack : : Lua ;
using namespace DFHack : : Lua : : Core ;
using namespace DFHack : : LuaWrapper ;
2020-02-05 15:36:59 -07:00
2020-02-14 18:47:26 -07:00
StackUnwinder unwinder ( State ) ;
PushModulePublic ( out , " utils " , " df_expr_to_ref " ) ;
2020-02-15 01:42:44 -07:00
Push ( parameters . at ( 0 ) ) ;
2020-02-14 18:47:26 -07:00
if ( ! SafeCall ( out , 1 , 1 ) )
{
return CR_FAILURE ;
}
2020-02-15 11:04:00 -07:00
if ( ! lua_touserdata ( State , - 1 ) )
{
return CR_WRONG_USAGE ;
}
2020-02-09 13:16:19 -07:00
2020-02-14 18:47:26 -07:00
ToCheck ref ;
ref . path . push_back ( parameters . at ( 0 ) ) ;
ref . ptr = get_object_ref ( State , - 1 ) ;
2020-02-15 01:42:44 -07:00
lua_getfield ( State , - 1 , " _type " ) ;
lua_getfield ( State , - 1 , " _identity " ) ;
ref . identity = reinterpret_cast < type_identity * > ( lua_touserdata ( State , - 1 ) ) ;
2020-02-14 18:47:26 -07:00
if ( ! ref . identity )
{
2020-02-19 10:40:31 -07:00
out . printerr ( " could not determine type identity \n " ) ;
2020-02-14 18:47:26 -07:00
return CR_FAILURE ;
}
2020-02-15 11:54:04 -07:00
checker . queue . push_back ( std : : move ( ref ) ) ;
2020-02-14 18:47:26 -07:00
}
2020-02-09 13:16:19 -07:00
2020-02-05 15:36:59 -07:00
return checker . check ( ) ? CR_OK : CR_FAILURE ;
}
Checker : : Checker ( color_ostream & out ) :
out ( out )
{
Core : : getInstance ( ) . p - > getMemRanges ( mapped ) ;
2020-02-14 18:47:26 -07:00
enums = false ;
sizes = false ;
2020-02-15 15:10:30 -07:00
lowmem = false ;
2020-03-01 11:15:26 -07:00
failfast = false ;
maxerrors = ~ size_t ( 0 ) ;
2020-02-05 15:36:59 -07:00
}
bool Checker : : check ( )
{
seen_addr . clear ( ) ;
2020-02-15 11:54:04 -07:00
num_checked = 0 ;
2020-02-05 15:36:59 -07:00
ok = true ;
2020-02-09 13:16:19 -07:00
while ( ! queue . empty ( ) )
{
2020-03-01 11:15:26 -07:00
if ( ! maxerrors )
{
out < < " hit max error count. bailing out with " < < queue . size ( ) < < " fields in queue. " < < std : : endl ;
break ;
}
2020-02-15 11:54:04 -07:00
ToCheck current ;
if ( lowmem )
{
current = std : : move ( queue . back ( ) ) ;
queue . pop_back ( ) ;
}
else
{
current = std : : move ( queue . front ( ) ) ;
queue . pop_front ( ) ;
}
2020-02-05 15:36:59 -07:00
2020-02-09 13:16:19 -07:00
check_dispatch ( current ) ;
2020-02-15 11:54:04 -07:00
num_checked + + ;
if ( out . is_console ( ) & & num_checked % 1000 = = 0 )
{
out < < " checked " < < num_checked < < " fields \r " < < std : : flush ;
}
2020-02-09 13:16:19 -07:00
}
2020-02-05 15:36:59 -07:00
2020-02-15 11:54:04 -07:00
out < < " checked " < < num_checked < < " fields " < < std : : endl ;
2020-02-09 13:16:19 -07:00
return ok ;
2020-02-05 15:36:59 -07:00
}
# define FAIL(message) \
do \
{ \
ok = false ; \
out < < COLOR_LIGHTRED < < " sanity check failed (line " < < __LINE__ < < " ): " ; \
2020-02-09 13:16:19 -07:00
out < < COLOR_RESET < < ( item . identity ? item . identity - > getFullName ( ) : " ? " ) < < " (accessed as " ; \
for ( auto & p : item . path ) { out < < p ; } \
2020-02-05 15:36:59 -07:00
out < < " ): " ; \
out < < COLOR_YELLOW < < message ; \
out < < COLOR_RESET < < std : : endl ; \
2020-03-01 11:15:26 -07:00
if ( maxerrors & & maxerrors ! = ~ size_t ( 0 ) ) \
maxerrors - - ; \
if ( failfast ) \
UNEXPECTED ; \
2020-02-05 15:36:59 -07:00
} while ( false )
# define PTR_ADD(base, offset) (reinterpret_cast<void *>(reinterpret_cast<uintptr_t>((base)) + static_cast<ptrdiff_t>((offset))))
2020-02-22 14:34:48 -07:00
# ifndef WIN32
const std : : string * Checker : : check_possible_stl_string_pointer ( const void * const * base )
{
std : : string empty_string ;
if ( * base = = * reinterpret_cast < void * * > ( & empty_string ) )
{
return reinterpret_cast < const std : : string * > ( base ) ;
}
const struct string_data_inner
{
size_t length ;
size_t capacity ;
int32_t refcount ;
} * str_data = static_cast < const string_data_inner * > ( * base ) - 1 ;
2020-02-23 20:33:32 -07:00
uint32_t tag = * reinterpret_cast < const uint32_t * > ( PTR_ADD ( str_data , - 8 ) ) ;
if ( tag = = 0xdfdf4ac8 )
2020-02-22 14:34:48 -07:00
{
2020-02-23 20:33:32 -07:00
size_t allocated_size = * reinterpret_cast < const size_t * > ( PTR_ADD ( str_data , - 16 ) ) ;
size_t expected_size = sizeof ( * str_data ) + str_data - > capacity + 1 ;
2020-02-22 14:34:48 -07:00
2020-02-23 20:33:32 -07:00
if ( allocated_size ! = expected_size )
2020-02-22 14:34:48 -07:00
{
return nullptr ;
}
}
2020-02-23 20:33:32 -07:00
else
2020-02-22 14:34:48 -07:00
{
return nullptr ;
}
if ( str_data - > capacity < str_data - > length )
{
return nullptr ;
}
const char * ptr = reinterpret_cast < const char * > ( * base ) ;
for ( size_t i = 0 ; i < str_data - > length ; i + + )
{
if ( ! * ptr + + )
{
return nullptr ;
}
}
if ( * ptr + + )
{
return nullptr ;
}
return reinterpret_cast < const std : : string * > ( base ) ;
}
# endif
2020-02-09 13:16:19 -07:00
bool Checker : : check_access ( const ToCheck & item , void * base , type_identity * identity )
2020-02-05 17:24:10 -07:00
{
2020-02-09 13:16:19 -07:00
return check_access ( item , base , identity , identity ? identity - > byte_size ( ) : 0 ) ;
2020-02-05 17:24:10 -07:00
}
2020-02-09 13:16:19 -07:00
bool Checker : : check_access ( const ToCheck & item , void * base , type_identity * identity , size_t size )
2020-02-05 15:36:59 -07:00
{
if ( ! base )
{
// null pointer: can't access, but not an error
return false ;
}
2020-02-09 13:16:19 -07:00
// assumes MALLOC_PERTURB_=45
# ifdef DFHACK64
# define UNINIT_PTR 0xd2d2d2d2d2d2d2d2
# define FAIL_PTR(message) FAIL(stl_sprintf("0x%016zx: ", reinterpret_cast<uintptr_t>(base)) << message)
# else
# define UNINIT_PTR 0xd2d2d2d2
# define FAIL_PTR(message) FAIL(stl_sprintf("0x%08zx: ", reinterpret_cast<uintptr_t>(base)) << message)
# endif
if ( reinterpret_cast < uintptr_t > ( base ) = = UNINIT_PTR )
{
FAIL_PTR ( " uninitialized pointer " ) ;
return false ;
}
2020-02-11 13:11:09 -07:00
bool found = true ;
void * expected_start = base ;
size_t remaining_size = size ;
while ( found )
2020-02-05 15:36:59 -07:00
{
2020-02-11 13:11:09 -07:00
found = false ;
2020-02-05 15:36:59 -07:00
2020-02-11 13:11:09 -07:00
for ( auto & range : mapped )
2020-02-05 15:36:59 -07:00
{
2020-02-11 13:11:09 -07:00
if ( ! range . isInRange ( expected_start ) )
{
continue ;
}
2020-02-05 15:36:59 -07:00
2020-02-11 13:11:09 -07:00
found = true ;
if ( ! range . valid | | ! range . read )
{
FAIL_PTR ( " pointer to invalid memory range " ) ;
return false ;
}
2020-02-05 15:36:59 -07:00
2020-02-11 13:11:09 -07:00
if ( size & & ! range . isInRange ( PTR_ADD ( expected_start , remaining_size - 1 ) ) )
{
void * next_start = PTR_ADD ( range . end , 1 ) ;
remaining_size - = reinterpret_cast < ptrdiff_t > ( next_start ) - reinterpret_cast < ptrdiff_t > ( expected_start ) ;
expected_start = next_start ;
break ;
}
return true ;
}
2020-02-05 15:36:59 -07:00
}
2020-02-11 13:11:09 -07:00
if ( expected_start = = base )
{
FAIL_PTR ( " pointer not in any mapped range " ) ;
}
else
{
FAIL_PTR ( " pointer exceeds mapped memory bounds (size " < < size < < " ) " ) ;
}
2020-02-05 15:36:59 -07:00
return false ;
2020-02-09 13:16:19 -07:00
# undef FAIL_PTR
2020-02-05 15:36:59 -07:00
}
2020-03-02 14:34:29 -07:00
const char * Checker : : check_vtable ( const ToCheck & item , void * vtable , type_identity * identity )
2020-02-05 15:36:59 -07:00
{
2020-02-09 13:16:19 -07:00
if ( ! check_access ( item , PTR_ADD ( vtable , - ptrdiff_t ( sizeof ( void * ) ) ) , identity , sizeof ( void * ) ) )
2020-03-02 14:34:29 -07:00
return nullptr ;
2020-02-05 17:24:10 -07:00
char * * info = * ( reinterpret_cast < char * * * > ( vtable ) - 1 ) ;
# ifdef WIN32
2020-02-09 13:16:19 -07:00
if ( ! check_access ( item , PTR_ADD ( info , 12 ) , identity , 4 ) )
2020-03-02 14:34:29 -07:00
return nullptr ;
2020-02-05 15:36:59 -07:00
2020-02-05 17:24:10 -07:00
# ifdef DFHACK64
void * base ;
if ( ! RtlPcToFileHeader ( info , & base ) )
2020-03-02 14:34:29 -07:00
return nullptr ;
2020-02-05 17:24:10 -07:00
char * typeinfo = reinterpret_cast < char * > ( base ) + reinterpret_cast < int32_t * > ( info ) [ 3 ] ;
char * name = typeinfo + 16 ;
# else
2020-02-05 19:21:32 -07:00
char * name = reinterpret_cast < char * > ( info ) + 8 ;
2020-02-05 17:24:10 -07:00
# endif
# else
2020-02-09 13:16:19 -07:00
if ( ! check_access ( item , info + 1 , identity , sizeof ( void * ) ) )
2020-03-02 14:34:29 -07:00
return nullptr ;
2020-02-05 17:24:10 -07:00
char * name = * ( info + 1 ) ;
# endif
2020-02-05 15:36:59 -07:00
for ( auto & range : mapped )
{
2020-02-05 17:24:10 -07:00
if ( ! range . isInRange ( name ) )
2020-02-05 15:36:59 -07:00
{
continue ;
}
if ( ! range . valid | | ! range . read )
{
2020-02-05 17:24:10 -07:00
FAIL ( " pointer to invalid memory range " ) ;
2020-03-02 14:34:29 -07:00
return nullptr ;
2020-02-05 15:36:59 -07:00
}
2020-02-09 14:12:25 -07:00
bool letter = false ;
2020-02-05 17:24:10 -07:00
for ( char * p = name ; ; p + + )
2020-02-05 15:36:59 -07:00
{
2020-02-05 17:24:10 -07:00
if ( ! range . isInRange ( p ) )
{
2020-03-02 14:34:29 -07:00
return nullptr ;
2020-02-05 17:24:10 -07:00
}
2020-02-05 15:36:59 -07:00
2020-02-09 14:12:25 -07:00
if ( * p > = ' a ' & & * p < = ' z ' )
2020-02-05 17:24:10 -07:00
{
2020-02-09 14:12:25 -07:00
letter = true ;
}
else if ( ! * p )
{
2020-03-02 14:34:29 -07:00
return letter ? name : nullptr ;
2020-02-05 17:24:10 -07:00
}
}
2020-02-05 15:36:59 -07:00
}
2020-03-02 14:34:29 -07:00
return nullptr ;
2020-02-05 15:36:59 -07:00
}
2020-02-09 13:16:19 -07:00
void Checker : : queue_field ( ToCheck & & item , const struct_field_info * field )
2020-02-05 15:36:59 -07:00
{
switch ( field - > mode )
{
case struct_field_info : : END :
2020-02-09 13:16:19 -07:00
UNEXPECTED ;
2020-02-05 15:36:59 -07:00
break ;
case struct_field_info : : PRIMITIVE :
2020-02-15 11:54:04 -07:00
queue . push_back ( std : : move ( item ) ) ;
2020-02-05 15:36:59 -07:00
break ;
case struct_field_info : : STATIC_STRING :
// TODO: check static strings?
break ;
case struct_field_info : : POINTER :
2020-02-29 12:11:23 -07:00
// TODO: flags inside field->count
2020-02-09 13:16:19 -07:00
item . temp_identity = std : : unique_ptr < df : : pointer_identity > ( new df : : pointer_identity ( field - > type ) ) ;
item . identity = item . temp_identity . get ( ) ;
2020-02-15 11:54:04 -07:00
queue . push_back ( std : : move ( item ) ) ;
2020-02-05 15:36:59 -07:00
break ;
case struct_field_info : : STATIC_ARRAY :
2020-02-09 14:12:25 -07:00
queue_static_array ( item , item . ptr , field - > type , field - > count , false , field - > eid ) ;
2020-02-05 15:36:59 -07:00
break ;
case struct_field_info : : SUBSTRUCT :
2020-02-15 11:54:04 -07:00
queue . push_back ( std : : move ( item ) ) ;
2020-02-05 15:36:59 -07:00
break ;
case struct_field_info : : CONTAINER :
2020-03-06 16:53:05 -07:00
if ( field - > type & & field - > type - > type ( ) = = IDTYPE_STRUCT )
queue_df_linked_list ( item ) ;
else
queue . push_back ( std : : move ( item ) ) ;
2020-02-05 15:36:59 -07:00
break ;
case struct_field_info : : STL_VECTOR_PTR :
2020-02-09 13:16:19 -07:00
item . temp_identity = std : : unique_ptr < df : : stl_ptr_vector_identity > ( new df : : stl_ptr_vector_identity ( field - > type , field - > eid ) ) ;
item . identity = item . temp_identity . get ( ) ;
2020-02-15 11:54:04 -07:00
queue . push_back ( std : : move ( item ) ) ;
2020-02-05 15:36:59 -07:00
break ;
case struct_field_info : : OBJ_METHOD :
case struct_field_info : : CLASS_METHOD :
// ignore
break ;
}
}
2020-02-09 14:12:25 -07:00
void Checker : : queue_static_array ( const ToCheck & array , void * base , type_identity * type , size_t count , bool pointer , enum_identity * ienum )
2020-02-05 15:36:59 -07:00
{
2020-02-14 18:47:26 -07:00
size_t size = pointer ? sizeof ( void * ) : type - > byte_size ( ) ;
2020-03-06 18:28:14 -07:00
bool is_linked_list = type & & is_df_linked_list ( type ) ;
2020-02-09 13:16:19 -07:00
for ( size_t i = 0 ; i < count ; i + + , base = PTR_ADD ( base , size ) )
{
ToCheck item ( array , i , base , type ) ;
2020-02-09 14:12:25 -07:00
if ( ienum )
{
2020-02-29 13:18:27 -07:00
auto pname = get_enum_item_key ( ienum , int64_t ( i ) ) ;
auto name = pname ? * pname : nullptr ;
2020-02-09 14:12:25 -07:00
std : : ostringstream str ;
str < < " [ " < < ienum - > getFullName ( ) < < " :: " ;
if ( name )
{
str < < name ;
}
else
{
str < < " ? " < < i < < " ? " ;
}
str < < " ] " ;
item . path . back ( ) = str . str ( ) ;
}
2020-02-09 13:16:19 -07:00
if ( pointer )
{
item . temp_identity = std : : unique_ptr < pointer_identity > ( new pointer_identity ( type ) ) ;
item . identity = item . temp_identity . get ( ) ;
}
2020-03-06 18:28:14 -07:00
else if ( is_linked_list )
{
queue_df_linked_list ( item ) ;
continue ;
}
2020-02-15 11:54:04 -07:00
queue . push_back ( std : : move ( item ) ) ;
2020-02-09 13:16:19 -07:00
}
}
2020-02-29 17:28:14 -07:00
bool Checker : : maybe_queue_union ( const ToCheck & item , const struct_field_info * fields , const struct_field_info * union_field )
2020-02-20 21:17:25 -07:00
{
2020-02-29 13:18:27 -07:00
auto tag_field = find_union_tag ( fields , union_field ) ;
2020-03-04 17:23:49 -07:00
if ( ! tag_field )
return false ;
2020-02-29 17:28:14 -07:00
2020-03-04 17:23:49 -07:00
ToCheck union_item ( item , " . " + std : : string ( union_field - > name ) , PTR_ADD ( item . ptr , union_field - > offset ) , union_field - > type ) ;
ToCheck tag_item ( item , " . " + std : : string ( tag_field - > name ) , PTR_ADD ( item . ptr , tag_field - > offset ) , tag_field - > type ) ;
2020-02-29 17:28:14 -07:00
2020-03-04 17:23:49 -07:00
if ( union_field - > mode = = struct_field_info : : SUBSTRUCT )
queue_union ( union_item , tag_item ) ;
else
queue_union_vector ( union_item , tag_item ) ;
2020-02-29 17:28:14 -07:00
2020-03-04 17:23:49 -07:00
return true ;
2020-02-29 17:28:14 -07:00
}
2020-02-20 21:17:25 -07:00
2020-02-29 17:28:14 -07:00
void Checker : : queue_union ( const ToCheck & item , const ToCheck & tag_item )
{
auto union_type = static_cast < union_identity * > ( item . identity ) ;
auto tag_type = static_cast < enum_identity * > ( tag_item . identity ) ;
2020-02-20 21:17:25 -07:00
int64_t tag_value = check_enum ( tag_item ) ;
2020-02-29 13:18:27 -07:00
2020-02-29 17:28:14 -07:00
auto ptag_key = get_enum_item_key ( tag_type , tag_value ) ;
2020-02-29 13:18:27 -07:00
auto tag_key = ptag_key ? * ptag_key : nullptr ;
if ( ! ptag_key )
2020-02-20 21:17:25 -07:00
{
2020-02-29 17:28:14 -07:00
FAIL ( " tagged union tag ( " < < join_strings ( " " , tag_item . path ) < < " ) out of range ( " < < tag_value < < " ) " ) ;
2020-02-20 21:17:25 -07:00
}
2020-02-29 13:18:27 -07:00
else if ( ! tag_key )
2020-02-20 21:17:25 -07:00
{
2020-02-29 17:28:14 -07:00
FAIL ( " tagged union tag ( " < < join_strings ( " " , tag_item . path ) < < " ) unnamed ( " < < tag_value < < " ) " ) ;
2020-02-20 21:17:25 -07:00
}
2020-02-29 13:18:27 -07:00
const struct_field_info * item_field = nullptr ;
if ( tag_key )
2020-02-20 21:17:25 -07:00
{
2020-02-29 13:18:27 -07:00
for ( auto field = union_type - > getFields ( ) ; field - > mode ! = struct_field_info : : END ; field + + )
2020-02-20 21:17:25 -07:00
{
2020-02-29 13:18:27 -07:00
if ( ! strcmp ( tag_key , field - > name ) )
{
item_field = field ;
break ;
}
}
2020-02-20 21:17:25 -07:00
}
2020-02-29 13:18:27 -07:00
if ( item_field )
2020-02-20 21:17:25 -07:00
{
2020-02-29 13:18:27 -07:00
// good to go
2020-02-29 17:28:14 -07:00
ToCheck tagged_union_item ( item , " . " + std : : string ( item_field - > name ) , item . ptr , item_field - > type ) ;
2020-02-29 13:18:27 -07:00
queue_field ( std : : move ( tagged_union_item ) , item_field ) ;
return ;
2020-02-20 21:17:25 -07:00
}
2020-02-29 17:28:14 -07:00
// if it's all uninitialized, ignore it
2020-02-29 17:36:00 -07:00
uint8_t uninit_value = * reinterpret_cast < const uint8_t * > ( item . ptr ) ;
2020-02-29 20:57:39 -07:00
bool all_uninitialized = uninit_value = = 0x00 | | uninit_value = = 0xd2 | | uninit_value = = 0xff ;
2020-02-29 17:36:00 -07:00
if ( all_uninitialized )
2020-02-29 17:28:14 -07:00
{
2020-02-29 17:36:00 -07:00
for ( size_t offset = 0 ; offset < union_type - > byte_size ( ) ; offset + + )
2020-02-29 17:28:14 -07:00
{
2020-02-29 17:36:00 -07:00
if ( * reinterpret_cast < const uint8_t * > ( PTR_ADD ( item . ptr , offset ) ) ! = uninit_value )
{
all_uninitialized = false ;
break ;
}
2020-02-29 17:28:14 -07:00
}
}
if ( all_uninitialized )
{
return ;
}
// if we don't know the key, we already warned above
if ( tag_key )
{
FAIL ( " tagged union ( " < < join_strings ( " " , tag_item . path ) < < " ) missing member for tag " < < tag_key < < " ( " < < tag_value < < " ) " ) ;
}
2020-02-29 13:18:27 -07:00
// if there's a pointer (we only check the first field for now)
// assume this could also be a pointer
if ( union_type - > getFields ( ) - > mode = = struct_field_info : : POINTER )
{
2020-02-29 17:28:14 -07:00
ToCheck untagged_union_item ( item , tag_key ? " . " + std : : string ( tag_key ) : stl_sprintf ( " .?% " PRId64 " ? " , tag_value ) , item . ptr , df : : identity_traits < void * > : : get ( ) ) ;
2020-02-29 13:18:27 -07:00
queue . push_back ( std : : move ( untagged_union_item ) ) ;
}
2020-02-20 21:17:25 -07:00
}
2020-02-29 17:28:14 -07:00
void Checker : : queue_union_vector ( const ToCheck & item , const ToCheck & tag_item )
{
2020-03-06 15:50:09 -07:00
auto union_container_type = static_cast < container_identity * > ( item . identity ) ;
auto tag_container_type = static_cast < container_identity * > ( tag_item . identity ) ;
if ( tag_container_type - > getFullName ( nullptr ) = = " vector<bool> " )
2020-03-06 15:48:33 -07:00
{
queue_union_bitvector ( item , tag_item ) ;
return ;
}
2020-03-06 15:50:09 -07:00
auto union_type = static_cast < union_identity * > ( union_container_type - > getItemType ( ) ) ;
auto tag_type = static_cast < enum_identity * > ( tag_container_type - > getItemType ( ) ) ;
2020-02-29 17:28:14 -07:00
auto union_count = check_vector_size ( item , union_type - > byte_size ( ) ) ;
auto tag_count = check_vector_size ( tag_item , tag_type - > byte_size ( ) ) ;
if ( union_count ! = tag_count )
{
FAIL ( " tagged union vector size ( " < < union_count < < " ) does not match tag vector ( " < < join_strings ( " " , tag_item . path ) < < " ) size ( " < < tag_count < < " ) " ) ;
}
auto union_base = * reinterpret_cast < void * * > ( item . ptr ) ;
auto tag_base = * reinterpret_cast < void * * > ( tag_item . ptr ) ;
2020-02-29 23:18:09 -07:00
auto count = union_count < tag_count ? union_count : tag_count ;
2020-02-29 17:28:14 -07:00
for ( size_t i = 0 ; i < count ; i + + , union_base = PTR_ADD ( union_base , union_type - > byte_size ( ) ) , tag_base = PTR_ADD ( tag_base , tag_type - > byte_size ( ) ) )
{
ToCheck union_item ( item , i , union_base , union_type ) ;
ToCheck tag ( tag_item , i , tag_base , tag_type ) ;
queue_union ( union_item , tag ) ;
}
}
2020-03-06 15:48:33 -07:00
void Checker : : queue_union_bitvector ( const ToCheck & item , const ToCheck & tag_item )
{
auto union_type = static_cast < union_identity * > ( static_cast < container_identity * > ( item . identity ) - > getItemType ( ) ) ;
auto union_count = check_vector_size ( item , union_type - > byte_size ( ) ) ;
if ( ! check_bitvector ( tag_item ) )
{
return ;
}
auto tag_vector = reinterpret_cast < std : : vector < bool > * > ( tag_item . ptr ) ;
if ( union_count ! = tag_vector - > size ( ) )
{
2020-03-06 15:50:09 -07:00
FAIL ( " tagged union vector size ( " < < union_count < < " ) does not match tag vector ( " < < join_strings ( " " , tag_item . path ) < < " ) size ( " < < tag_vector - > size ( ) < < " ) " ) ;
2020-03-06 15:48:33 -07:00
}
auto union_base = * reinterpret_cast < void * * > ( item . ptr ) ;
auto count = union_count < tag_vector - > size ( ) ? union_count : tag_vector - > size ( ) ;
for ( size_t i = 0 ; i < count ; i + + , union_base = PTR_ADD ( union_base , union_type - > byte_size ( ) ) )
{
auto item_field = & union_type - > getFields ( ) [ tag_vector - > at ( i ) ? 1 : 0 ] ;
ToCheck tagged_union_item ( item , stl_sprintf ( " [%zu].%s " , i , item_field - > name ) , union_base , item_field - > type ) ;
queue_field ( std : : move ( tagged_union_item ) , item_field ) ;
}
}
2020-03-06 16:53:05 -07:00
void Checker : : queue_df_linked_list ( const ToCheck & item )
{
2020-03-06 18:28:14 -07:00
if ( ! is_df_linked_list ( item . identity ) )
2020-03-06 16:53:05 -07:00
{
UNEXPECTED ;
return ;
}
2020-03-06 18:28:14 -07:00
auto item_type = static_cast < struct_identity * > ( item . identity ) - > getFields ( ) [ 2 ] . type ;
2020-03-06 16:53:05 -07:00
int index = - 1 ;
2020-03-06 18:28:14 -07:00
struct df_linked_list_entry
{
2020-03-06 19:04:17 -07:00
void * item ;
2020-03-06 18:28:14 -07:00
df_linked_list_entry * prev ;
df_linked_list_entry * next ;
} * prev_ptr = nullptr , * cur_ptr = reinterpret_cast < df_linked_list_entry * > ( item . ptr ) ;
2020-03-06 16:53:05 -07:00
while ( cur_ptr )
{
2020-03-06 18:28:14 -07:00
if ( prev_ptr ! = cur_ptr - > prev )
2020-03-06 16:53:05 -07:00
{
2020-03-06 18:28:14 -07:00
FAIL ( " linked list element " < < index < < " previous element pointer " < < stl_sprintf ( " %p " , cur_ptr - > prev ) < < " does not match actual previous element " < < stl_sprintf ( " %p " , prev_ptr ) ) ;
2020-03-06 16:53:05 -07:00
return ;
}
2020-03-06 18:28:14 -07:00
auto item_ptr_ptr = reinterpret_cast < void * > ( & cur_ptr - > item ) ;
std : : unique_ptr < df : : pointer_identity > item_ptr_identity ( new df : : pointer_identity ( item_type ) ) ;
2020-03-06 16:53:05 -07:00
ToCheck item_item ( item , stl_sprintf ( " [%d].item " , index ) , item_ptr_ptr , item_ptr_identity . get ( ) ) ;
item_item . temp_identity = std : : move ( item_ptr_identity ) ;
queue . push_back ( std : : move ( item_item ) ) ;
2020-03-06 18:28:14 -07:00
auto next_ptr = reinterpret_cast < void * > ( cur_ptr - > next ) ;
2020-03-06 16:53:05 -07:00
ToCheck next_item ( item , stl_sprintf ( " [%d].next " , index ) , next_ptr , item . identity ) ;
if ( check_access ( next_item , next_ptr , item . identity ) )
{
prev_ptr = cur_ptr ;
2020-03-06 18:28:14 -07:00
cur_ptr = cur_ptr - > next ;
2020-03-06 16:53:05 -07:00
}
else
{
cur_ptr = nullptr ;
}
index + + ;
}
}
2020-02-29 13:18:27 -07:00
void Checker : : check_dispatch ( ToCheck & item )
2020-02-09 13:16:19 -07:00
{
2020-02-21 17:49:02 -07:00
if ( reinterpret_cast < uintptr_t > ( item . ptr ) = = UNINIT_PTR )
2020-02-05 15:36:59 -07:00
{
2020-02-21 17:49:02 -07:00
// allow uninitialized raw pointers
2020-02-05 15:36:59 -07:00
return ;
}
2020-02-21 17:49:02 -07:00
if ( ! item . identity )
2020-02-13 18:55:49 -07:00
{
2020-02-21 17:49:02 -07:00
// warn about bad pointers
2020-02-22 13:04:53 -07:00
if ( ! check_access ( item , item . ptr , df : : identity_traits < void * > : : get ( ) , 1 ) )
{
return ;
}
if ( sizes )
{
uint32_t tag = * reinterpret_cast < uint32_t * > ( PTR_ADD ( item . ptr , - 8 ) ) ;
if ( tag = = 0xdfdf4ac8 )
{
2020-02-22 13:10:26 -07:00
size_t allocated_size = * reinterpret_cast < size_t * > ( PTR_ADD ( item . ptr , - 16 ) ) ;
2020-02-22 13:04:53 -07:00
FAIL ( " pointer to a block of " < < allocated_size < < " bytes of allocated memory " ) ;
2020-02-29 13:18:27 -07:00
// check recursively if it might be a valid pointer
if ( allocated_size = = sizeof ( void * ) )
{
item . path . push_back ( " .?ptr? " ) ;
item . path . push_back ( " " ) ;
item . identity = df : : identity_traits < void * > : : get ( ) ;
}
2020-03-02 20:33:04 -07:00
else if ( allocated_size > = MIN_SIZE_FOR_SUGGEST & & known_types_by_size . count ( allocated_size ) )
{
FAIL ( " known types of this size: " < < join_strings ( " , " , known_types_by_size . at ( allocated_size ) ) ) ;
}
2020-02-22 13:04:53 -07:00
}
2020-02-22 14:34:48 -07:00
# ifndef WIN32
else if ( auto str = check_possible_stl_string_pointer ( & item . ptr ) )
{
FAIL ( " untyped pointer is actually stl-string with value \" " < < * str < < " \" (length " < < str - > length ( ) < < " ) " ) ;
}
# endif
2020-03-02 14:34:29 -07:00
else if ( auto vtable_name = check_vtable ( item , item . ptr , df : : identity_traits < void * > : : get ( ) ) )
{
FAIL ( " pointer to a vtable: " < < vtable_name ) ;
}
2020-02-22 14:34:48 -07:00
else
{
2020-02-23 20:33:32 -07:00
FAIL ( " pointer to memory with no size information " ) ;
2020-02-22 14:34:48 -07:00
}
2020-02-22 13:04:53 -07:00
}
2020-02-21 17:49:02 -07:00
2020-02-29 13:18:27 -07:00
// could have been set above
if ( ! item . identity )
{
return ;
}
2020-02-13 18:55:49 -07:00
}
2020-02-09 13:16:19 -07:00
if ( ! check_access ( item , item . ptr , item . identity ) & & item . identity - > type ( ) ! = IDTYPE_GLOBAL )
{
return ;
}
2020-02-29 14:08:39 -07:00
// special case for large_integer weirdness
if ( item . identity = = df : : identity_traits < df : : large_integer > : : get ( ) )
{
item . identity = df : : identity_traits < int64_t > : : get ( ) ;
}
2020-02-09 13:16:19 -07:00
switch ( item . identity - > type ( ) )
2020-02-05 15:36:59 -07:00
{
case IDTYPE_GLOBAL :
2020-02-09 13:16:19 -07:00
check_global ( item ) ;
2020-02-05 15:36:59 -07:00
break ;
case IDTYPE_FUNCTION :
2020-02-09 13:16:19 -07:00
// don't check functions
2020-02-05 15:36:59 -07:00
break ;
case IDTYPE_PRIMITIVE :
2020-02-09 13:16:19 -07:00
check_primitive ( item ) ;
2020-02-05 15:36:59 -07:00
break ;
case IDTYPE_POINTER :
2020-02-09 13:16:19 -07:00
check_pointer ( item ) ;
2020-02-05 15:36:59 -07:00
break ;
case IDTYPE_CONTAINER :
case IDTYPE_PTR_CONTAINER :
2020-02-09 13:16:19 -07:00
case IDTYPE_BIT_CONTAINER :
2020-02-05 15:36:59 -07:00
case IDTYPE_STL_PTR_VECTOR :
2020-02-09 13:16:19 -07:00
check_container ( item ) ;
break ;
case IDTYPE_BUFFER :
{
auto item_identity = static_cast < container_identity * > ( item . identity ) - > getItemType ( ) ;
2020-02-09 14:12:25 -07:00
auto ienum = static_cast < enum_identity * > ( static_cast < container_identity * > ( item . identity ) - > getIndexEnumType ( ) ) ;
queue_static_array ( item , item . ptr , item_identity , item . identity - > byte_size ( ) / item_identity - > byte_size ( ) , false , ienum ) ;
2020-02-09 13:16:19 -07:00
}
2020-02-05 15:36:59 -07:00
break ;
case IDTYPE_BITFIELD :
2020-02-09 13:16:19 -07:00
check_bitfield ( item ) ;
2020-02-05 15:36:59 -07:00
break ;
case IDTYPE_ENUM :
2020-02-09 13:16:19 -07:00
check_enum ( item ) ;
2020-02-05 15:36:59 -07:00
break ;
2020-02-29 12:11:23 -07:00
case IDTYPE_UNION :
2020-02-29 17:28:14 -07:00
FAIL ( " untagged union " ) ;
2020-02-29 13:18:27 -07:00
check_struct ( item ) ;
break ;
case IDTYPE_STRUCT :
2020-02-09 13:16:19 -07:00
check_struct ( item ) ;
2020-02-05 15:36:59 -07:00
break ;
case IDTYPE_CLASS :
2020-02-09 13:16:19 -07:00
check_virtual ( item ) ;
2020-02-05 15:36:59 -07:00
break ;
case IDTYPE_OPAQUE :
2020-02-09 13:16:19 -07:00
// can't check opaque
2020-02-05 15:36:59 -07:00
break ;
}
}
2020-02-09 13:16:19 -07:00
void Checker : : check_global ( const ToCheck & globals )
2020-02-05 15:36:59 -07:00
{
2020-02-09 13:16:19 -07:00
auto identity = static_cast < global_identity * > ( globals . identity ) ;
for ( auto field = identity - > getFields ( ) ; field - > mode ! = struct_field_info : : END ; field + + )
2020-02-05 15:36:59 -07:00
{
2020-02-09 13:16:19 -07:00
ToCheck item ( globals , field - > name , nullptr , field - > type ) ;
2020-02-21 16:31:22 -07:00
item . path . push_back ( " " ) ; // tell check_struct that this is a pointer
2020-02-09 13:16:19 -07:00
auto base = reinterpret_cast < void * * > ( field - > offset ) ;
if ( ! check_access ( item , base , df : : identity_traits < void * > : : get ( ) ) )
{
continue ;
}
item . ptr = * base ;
if ( ! seen_addr . insert ( item . ptr ) . second )
{
continue ;
}
queue_field ( std : : move ( item ) , field ) ;
2020-02-05 15:36:59 -07:00
}
2020-02-09 13:16:19 -07:00
}
2020-02-05 15:36:59 -07:00
2020-02-09 13:16:19 -07:00
void Checker : : check_primitive ( const ToCheck & item )
{
if ( item . identity - > getFullName ( ) = = " string " )
2020-02-05 15:36:59 -07:00
{
2020-02-09 13:16:19 -07:00
check_stl_string ( item ) ;
2020-02-05 15:36:59 -07:00
return ;
}
2020-02-22 13:04:53 -07:00
if ( item . identity - > getFullName ( ) = = " bool " )
{
auto value = * reinterpret_cast < uint8_t * > ( item . ptr ) ;
if ( value > 1 & & value ! = 0xd2 )
{
FAIL ( " invalid boolean value " < < stl_sprintf ( " %d (0x%02x) " , value , value ) ) ;
}
return ;
}
2020-02-09 13:16:19 -07:00
// TODO: check other primitives?
}
void Checker : : check_stl_string ( const ToCheck & item )
{
if ( ! seen_addr . insert ( item . ptr ) . second )
2020-02-05 17:24:10 -07:00
{
return ;
}
2020-02-09 13:16:19 -07:00
if ( ! check_access ( item , item . ptr , item . identity ) )
2020-02-05 15:36:59 -07:00
{
return ;
}
2020-02-09 13:16:19 -07:00
# ifdef WIN32
struct string_data
2020-02-05 15:36:59 -07:00
{
2020-02-09 13:16:19 -07:00
union
{
uintptr_t start ;
char local_data [ 16 ] ;
} ;
size_t length ;
size_t capacity ;
} ;
# else
struct string_data
{
struct string_data_inner
{
size_t length ;
size_t capacity ;
2020-02-21 16:31:22 -07:00
int32_t refcount ;
2020-02-09 13:16:19 -07:00
} * ptr ;
} ;
# endif
2020-02-05 15:36:59 -07:00
2020-02-09 13:16:19 -07:00
if ( item . identity - > byte_size ( ) ! = sizeof ( string_data ) )
{
UNEXPECTED ;
return ;
2020-02-05 15:36:59 -07:00
}
2020-02-09 13:16:19 -07:00
auto string = reinterpret_cast < string_data * > ( item . ptr ) ;
# ifdef WIN32
bool is_local = string - > capacity < 16 ;
char * start = is_local ? & string - > local_data [ 0 ] : reinterpret_cast < char * > ( string - > start ) ;
ptrdiff_t length = string - > length ;
ptrdiff_t capacity = string - > capacity ;
# else
if ( ! check_access ( item , string - > ptr , item . identity , 1 ) )
2020-02-05 15:36:59 -07:00
{
2020-02-21 14:07:48 -07:00
// nullptr is NOT okay here
2020-02-21 16:31:22 -07:00
FAIL ( " invalid string pointer " < < stl_sprintf ( " %p " , string - > ptr ) ) ;
2020-02-05 15:36:59 -07:00
return ;
}
2020-02-09 13:16:19 -07:00
if ( ! check_access ( item , string - > ptr - 1 , item . identity , sizeof ( * string - > ptr ) ) )
2020-02-05 15:36:59 -07:00
{
return ;
}
2020-02-09 13:16:19 -07:00
char * start = reinterpret_cast < char * > ( string - > ptr ) ;
ptrdiff_t length = ( string - > ptr - 1 ) - > length ;
ptrdiff_t capacity = ( string - > ptr - 1 ) - > capacity ;
# endif
if ( length < 0 )
{
FAIL ( " string length is negative ( " < < length < < " ) " ) ;
}
2020-02-21 16:31:22 -07:00
else if ( capacity < 0 )
2020-02-09 13:16:19 -07:00
{
FAIL ( " string capacity is negative ( " < < capacity < < " ) " ) ;
}
else if ( capacity < length )
{
FAIL ( " string capacity ( " < < capacity < < " ) is less than length ( " < < length < < " ) " ) ;
}
2020-02-21 16:31:22 -07:00
# ifndef WIN32
const std : : string empty_string ;
auto empty_string_data = reinterpret_cast < const string_data * > ( & empty_string ) ;
if ( sizes & & string - > ptr ! = empty_string_data - > ptr )
{
uint32_t tag = * reinterpret_cast < uint32_t * > ( PTR_ADD ( string - > ptr - 1 , - 8 ) ) ;
if ( tag = = 0xdfdf4ac8 )
{
size_t allocated_size = * reinterpret_cast < size_t * > ( PTR_ADD ( string - > ptr - 1 , - 16 ) ) ;
size_t expected_size = sizeof ( * string - > ptr ) + capacity + 1 ;
if ( allocated_size ! = expected_size )
{
FAIL ( " allocated string data size ( " < < allocated_size < < " ) does not match expected size ( " < < expected_size < < " ) " ) ;
}
}
2020-02-23 20:33:32 -07:00
else
2020-02-21 16:31:22 -07:00
{
2020-03-02 21:30:23 -07:00
FAIL ( " pointer does not appear to be a string " ) ;
//UNEXPECTED;
2020-02-21 16:31:22 -07:00
}
}
# endif
2020-02-09 13:16:19 -07:00
check_access ( item , start , item . identity , capacity ) ;
}
2020-02-05 15:36:59 -07:00
2020-02-09 13:16:19 -07:00
void Checker : : check_pointer ( const ToCheck & item )
{
2020-02-21 16:31:22 -07:00
if ( ! seen_addr . insert ( item . ptr ) . second )
2020-02-05 15:36:59 -07:00
{
return ;
}
2020-02-21 16:31:22 -07:00
auto base = * reinterpret_cast < void * * > ( item . ptr ) ;
auto base_int = uintptr_t ( base ) ;
if ( base_int ! = UNINIT_PTR & & base_int % alignof ( void * ) ! = 0 )
2020-02-05 15:36:59 -07:00
{
2020-02-21 16:31:22 -07:00
FAIL ( " unaligned pointer " < < stl_sprintf ( " %p " , base ) ) ;
2020-02-05 15:36:59 -07:00
}
2020-02-09 13:16:19 -07:00
2020-02-21 16:31:22 -07:00
auto target_identity = static_cast < pointer_identity * > ( item . identity ) - > getTarget ( ) ;
queue . push_back ( ToCheck ( item , " " , base , target_identity ) ) ;
2020-02-09 13:16:19 -07:00
}
void Checker : : check_bitfield ( const ToCheck & item )
{
2020-02-14 18:47:26 -07:00
if ( ! enums )
{
return ;
}
auto identity = static_cast < bitfield_identity * > ( item . identity ) ;
uint64_t val = 0 ;
for ( size_t offset = 0 ; offset < identity - > byte_size ( ) ; offset + + )
{
val | = uint64_t ( * reinterpret_cast < uint8_t * > ( PTR_ADD ( item . ptr , offset ) ) ) < < ( 8 * offset ) ;
}
size_t num_bits = identity - > getNumBits ( ) ;
auto bits = identity - > getBits ( ) ;
for ( size_t i = 0 ; i < num_bits ; i + + )
{
if ( bits [ i ] . size < 0 )
continue ;
if ( bits [ i ] . name )
continue ;
2020-02-15 17:18:30 -07:00
if ( ! ( val & ( 1ULL < < i ) ) )
2020-02-14 18:47:26 -07:00
continue ;
if ( bits [ i ] . size )
{
FAIL ( " bitfield bit " < < i < < " is unnamed " ) ;
}
else
{
FAIL ( " bitfield bit " < < i < < " past the defined end of the bitfield " ) ;
}
}
2020-02-09 13:16:19 -07:00
}
2020-02-20 21:17:25 -07:00
int64_t Checker : : check_enum ( const ToCheck & item )
2020-02-09 13:16:19 -07:00
{
2020-02-14 18:47:26 -07:00
auto identity = static_cast < enum_identity * > ( item . identity ) ;
int64_t value ;
switch ( identity - > byte_size ( ) )
{
case 1 :
if ( identity - > getFirstItem ( ) < 0 )
value = * reinterpret_cast < int8_t * > ( item . ptr ) ;
else
value = * reinterpret_cast < uint8_t * > ( item . ptr ) ;
break ;
case 2 :
if ( identity - > getFirstItem ( ) < 0 )
value = * reinterpret_cast < int16_t * > ( item . ptr ) ;
else
value = * reinterpret_cast < uint16_t * > ( item . ptr ) ;
break ;
case 4 :
if ( identity - > getFirstItem ( ) < 0 )
value = * reinterpret_cast < int32_t * > ( item . ptr ) ;
else
value = * reinterpret_cast < uint32_t * > ( item . ptr ) ;
break ;
case 8 :
value = * reinterpret_cast < int64_t * > ( item . ptr ) ;
break ;
default :
UNEXPECTED ;
2020-02-20 21:17:25 -07:00
return - 1 ;
}
if ( ! enums )
{
return value ;
2020-02-14 18:47:26 -07:00
}
2020-02-29 13:18:27 -07:00
auto key = get_enum_item_key ( identity , value ) ;
if ( ! key )
2020-02-14 18:47:26 -07:00
{
2020-02-29 13:18:27 -07:00
if ( identity - > getComplex ( ) )
2020-02-14 18:47:26 -07:00
{
FAIL ( " enum value ( " < < value < < " ) is not defined (complex enum) " ) ;
}
2020-02-29 13:18:27 -07:00
else
2020-02-14 18:47:26 -07:00
{
FAIL ( " enum value ( " < < value < < " ) outside of defined range ( " < < identity - > getFirstItem ( ) < < " to " < < identity - > getLastItem ( ) < < " ) " ) ;
}
}
2020-02-29 13:18:27 -07:00
else if ( ! * key )
2020-02-14 18:47:26 -07:00
{
FAIL ( " enum value ( " < < value < < " ) is unnamed " ) ;
}
2020-02-20 21:17:25 -07:00
return value ;
2020-02-09 13:16:19 -07:00
}
void Checker : : check_container ( const ToCheck & item )
{
auto identity = static_cast < container_identity * > ( item . identity ) ;
if ( ! seen_addr . insert ( item . ptr ) . second )
2020-02-05 15:36:59 -07:00
{
return ;
}
auto void_name = identity - > getFullName ( nullptr ) ;
2020-02-09 13:16:19 -07:00
if ( void_name = = " vector<void> " )
{
check_vector ( item , identity - > getItemType ( ) , false ) ;
}
else if ( void_name = = " vector<void*> " )
2020-02-05 15:36:59 -07:00
{
2020-02-09 13:16:19 -07:00
check_vector ( item , identity - > getItemType ( ) , true ) ;
2020-02-05 15:36:59 -07:00
}
else if ( void_name = = " deque<void> " )
{
2020-02-09 13:16:19 -07:00
check_deque ( item , identity - > getItemType ( ) ) ;
2020-02-05 15:36:59 -07:00
}
2020-02-05 18:06:14 -07:00
else if ( void_name = = " DfArray<void> " )
{
2020-02-09 13:16:19 -07:00
check_dfarray ( item , identity - > getItemType ( ) ) ;
}
else if ( void_name = = " BitArray<> " )
{
check_bitarray ( item ) ;
}
else if ( void_name = = " vector<bool> " )
{
check_bitvector ( item ) ;
2020-02-05 18:06:14 -07:00
}
2020-02-05 15:36:59 -07:00
else
{
FAIL ( " TODO: " < < void_name ) ;
UNEXPECTED ;
}
}
2020-02-29 17:28:14 -07:00
size_t Checker : : check_vector_size ( const ToCheck & item , size_t item_size )
2020-02-05 15:36:59 -07:00
{
struct vector_data
{
uintptr_t start ;
uintptr_t finish ;
uintptr_t end_of_storage ;
} ;
2020-02-09 13:16:19 -07:00
if ( item . identity - > byte_size ( ) ! = sizeof ( vector_data ) )
2020-02-05 15:36:59 -07:00
{
UNEXPECTED ;
2020-02-29 17:28:14 -07:00
return 0 ;
2020-02-05 15:36:59 -07:00
}
2020-02-09 13:16:19 -07:00
vector_data vector = * reinterpret_cast < vector_data * > ( item . ptr ) ;
2020-02-05 15:36:59 -07:00
ptrdiff_t length = vector . finish - vector . start ;
ptrdiff_t capacity = vector . end_of_storage - vector . start ;
bool local_ok = true ;
if ( vector . start > vector . finish )
{
local_ok = false ;
2020-02-05 19:21:32 -07:00
FAIL ( " vector length is negative ( " < < ( length / ptrdiff_t ( item_size ) ) < < " ) " ) ;
2020-02-05 15:36:59 -07:00
}
if ( vector . start > vector . end_of_storage )
{
local_ok = false ;
2020-02-05 19:21:32 -07:00
FAIL ( " vector capacity is negative ( " < < ( capacity / ptrdiff_t ( item_size ) ) < < " ) " ) ;
2020-02-05 15:36:59 -07:00
}
else if ( vector . finish > vector . end_of_storage )
{
local_ok = false ;
2020-02-05 19:21:32 -07:00
FAIL ( " vector capacity ( " < < ( capacity / ptrdiff_t ( item_size ) ) < < " ) is less than its length ( " < < ( length / ptrdiff_t ( item_size ) ) < < " ) " ) ;
2020-02-05 15:36:59 -07:00
}
2020-02-29 17:28:14 -07:00
if ( ! item_size )
2020-02-09 13:25:48 -07:00
{
2020-02-29 17:28:14 -07:00
return 0 ;
2020-02-09 13:25:48 -07:00
}
2020-02-05 15:36:59 -07:00
size_t ulength = size_t ( length ) ;
size_t ucapacity = size_t ( capacity ) ;
if ( ulength % item_size ! = 0 )
{
local_ok = false ;
FAIL ( " vector length is non-integer ( " < < ( ulength / item_size ) < < " items plus " < < ( ulength % item_size ) < < " bytes) " ) ;
}
if ( ucapacity % item_size ! = 0 )
{
local_ok = false ;
FAIL ( " vector capacity is non-integer ( " < < ( ucapacity / item_size ) < < " items plus " < < ( ucapacity % item_size ) < < " bytes) " ) ;
}
2020-02-29 17:28:14 -07:00
if ( local_ok & & capacity & & ! vector . start )
2020-02-11 16:17:11 -07:00
{
2020-02-29 17:28:14 -07:00
FAIL ( " vector has null pointer but capacity " < < ( capacity / item_size ) ) ;
return 0 ;
2020-02-11 16:17:11 -07:00
}
2020-02-29 17:28:14 -07:00
if ( ! check_access ( item , reinterpret_cast < void * > ( vector . start ) , item . identity , capacity ) )
2020-02-05 15:36:59 -07:00
{
2020-02-29 17:28:14 -07:00
return 0 ;
}
return local_ok ? ulength / item_size : 0 ;
}
void Checker : : check_vector ( const ToCheck & item , type_identity * item_identity , bool pointer )
{
size_t item_size = pointer ? sizeof ( void * ) : item_identity - > byte_size ( ) ;
if ( ! item_identity & & pointer & & ! sizes )
{
// non-identified vector type in structures
item_size = 0 ;
2020-02-05 15:36:59 -07:00
}
2020-02-29 17:28:14 -07:00
size_t count = check_vector_size ( item , item_size ) ;
if ( item . path . back ( ) = = " .bad " | | count = = 0 )
2020-02-21 16:31:22 -07:00
{
2020-02-29 17:28:14 -07:00
// don't check contents
return ;
2020-02-21 16:31:22 -07:00
}
2020-02-29 17:28:14 -07:00
void * start = * reinterpret_cast < void * * > ( item . ptr ) ;
auto ienum = static_cast < enum_identity * > ( static_cast < container_identity * > ( item . identity ) - > getIndexEnumType ( ) ) ;
queue_static_array ( item , start , item_identity , count , pointer , ienum ) ;
2020-02-05 15:36:59 -07:00
}
2020-02-09 13:16:19 -07:00
void Checker : : check_deque ( const ToCheck & item , type_identity * item_identity )
2020-02-05 15:36:59 -07:00
{
// TODO: check deque?
}
2020-02-09 13:16:19 -07:00
void Checker : : check_dfarray ( const ToCheck & item , type_identity * item_identity )
2020-02-05 18:06:14 -07:00
{
struct dfarray_data
{
uintptr_t start ;
unsigned short size ;
} ;
2020-02-09 13:16:19 -07:00
if ( item . identity - > byte_size ( ) ! = sizeof ( dfarray_data ) )
2020-02-05 18:06:14 -07:00
{
UNEXPECTED ;
return ;
}
2020-02-09 13:16:19 -07:00
dfarray_data dfarray = * reinterpret_cast < dfarray_data * > ( item . ptr ) ;
2020-02-05 18:06:14 -07:00
size_t length = dfarray . size ;
size_t item_size = item_identity - > byte_size ( ) ;
2020-02-09 13:16:19 -07:00
if ( check_access ( item , reinterpret_cast < void * > ( dfarray . start ) , item . identity , item_size * length ) )
2020-02-05 18:06:14 -07:00
{
2020-02-09 14:12:25 -07:00
auto ienum = static_cast < enum_identity * > ( static_cast < container_identity * > ( item . identity ) - > getIndexEnumType ( ) ) ;
queue_static_array ( item , reinterpret_cast < void * > ( dfarray . start ) , item_identity , length , false , ienum ) ;
2020-02-05 18:06:14 -07:00
}
}
2020-02-09 13:16:19 -07:00
void Checker : : check_bitarray ( const ToCheck & item )
2020-02-05 15:36:59 -07:00
{
2020-02-09 13:16:19 -07:00
// TODO: check DFHack::BitArray?
}
2020-02-05 15:36:59 -07:00
2020-03-06 15:48:33 -07:00
bool Checker : : check_bitvector ( const ToCheck & item )
2020-02-09 13:16:19 -07:00
{
2020-02-05 15:36:59 -07:00
struct biterator_data
{
uintptr_t ptr ;
unsigned int offset ;
} ;
struct bvector_data
{
biterator_data start ;
biterator_data finish ;
uintptr_t end_of_storage ;
} ;
2020-02-09 13:16:19 -07:00
if ( item . identity - > byte_size ( ) ! = sizeof ( bvector_data ) )
2020-02-05 15:36:59 -07:00
{
UNEXPECTED ;
2020-03-06 15:48:33 -07:00
return false ;
2020-02-05 15:36:59 -07:00
}
// TODO: check vector<bool>?
2020-03-06 15:48:33 -07:00
return true ;
2020-02-05 15:36:59 -07:00
}
2020-02-09 13:16:19 -07:00
void Checker : : check_struct ( const ToCheck & item )
2020-02-05 15:36:59 -07:00
{
2020-02-14 18:47:26 -07:00
bool is_pointer = item . path . back ( ) . empty ( ) ;
bool is_virtual = ! item . path . back ( ) . empty ( ) & & item . path . back ( ) . at ( 0 ) = = ' < ' ;
2020-02-21 16:31:22 -07:00
bool is_virtual_pointer = is_virtual & & item . path . size ( ) > = 2 & & item . path . at ( item . path . size ( ) - 2 ) . empty ( ) ;
if ( sizes & & uintptr_t ( item . ptr ) % 32 = = 16 & & ( is_pointer | | is_virtual_pointer ) )
2020-02-14 18:47:26 -07:00
{
uint32_t tag = * reinterpret_cast < uint32_t * > ( PTR_ADD ( item . ptr , - 8 ) ) ;
if ( tag = = 0xdfdf4ac8 )
{
size_t allocated_size = * reinterpret_cast < size_t * > ( PTR_ADD ( item . ptr , - 16 ) ) ;
size_t expected_size = item . identity - > byte_size ( ) ;
if ( allocated_size ! = expected_size )
{
FAIL ( " allocated structure size ( " < < allocated_size < < " ) does not match expected size ( " < < expected_size < < " ) " ) ;
}
}
2020-02-23 20:33:32 -07:00
else
2020-02-21 16:31:22 -07:00
{
2020-03-02 21:30:23 -07:00
FAIL ( " unknown allocation size; possibly bad " ) ;
//UNEXPECTED;
2020-02-21 16:31:22 -07:00
}
2020-02-14 18:47:26 -07:00
}
2020-02-12 17:01:49 -07:00
for ( auto identity = static_cast < struct_identity * > ( item . identity ) ; identity ; identity = identity - > getParent ( ) )
2020-02-05 15:36:59 -07:00
{
2020-02-12 17:01:49 -07:00
auto fields = identity - > getFields ( ) ;
if ( ! fields )
{
continue ;
}
for ( auto field = fields ; field - > mode ! = struct_field_info : : END ; field + + )
{
2020-02-29 17:28:14 -07:00
if ( maybe_queue_union ( item , fields , field ) )
2020-02-20 21:17:25 -07:00
{
continue ;
}
2020-03-06 18:28:14 -07:00
if ( field - > mode = = struct_field_info : : POINTER & & is_df_linked_list ( field - > type ) )
2020-03-06 16:53:05 -07:00
{
// skip linked list pointers
continue ;
}
2020-02-12 17:01:49 -07:00
ToCheck child ( item , std : : string ( " . " ) + field - > name , PTR_ADD ( item . ptr , field - > offset ) , field - > type ) ;
2020-02-05 15:36:59 -07:00
2020-02-12 17:01:49 -07:00
queue_field ( std : : move ( child ) , field ) ;
}
2020-02-05 17:24:10 -07:00
}
2020-02-05 15:36:59 -07:00
}
2020-02-05 17:24:10 -07:00
2020-02-09 13:16:19 -07:00
void Checker : : check_virtual ( const ToCheck & item )
2020-02-05 17:24:10 -07:00
{
2020-02-09 13:16:19 -07:00
if ( ! seen_addr . insert ( item . ptr ) . second )
2020-02-05 17:24:10 -07:00
{
return ;
}
2020-02-09 13:16:19 -07:00
if ( ! check_access ( item , item . ptr , item . identity ) )
2020-02-05 17:24:10 -07:00
{
return ;
}
2020-02-09 13:16:19 -07:00
auto identity = static_cast < virtual_identity * > ( item . identity ) ;
2020-02-05 17:24:10 -07:00
2020-02-09 13:16:19 -07:00
void * vtable = * reinterpret_cast < void * * > ( item . ptr ) ;
if ( ! check_vtable ( item , vtable , identity ) )
2020-02-05 17:24:10 -07:00
{
2020-02-09 13:16:19 -07:00
FAIL ( " invalid vtable pointer " ) ;
2020-02-05 17:24:10 -07:00
return ;
}
2020-02-09 13:16:19 -07:00
else if ( ! identity - > is_instance ( reinterpret_cast < virtual_ptr > ( item . ptr ) ) )
2020-02-05 17:24:10 -07:00
{
2020-02-09 13:16:19 -07:00
auto class_name = Core : : getInstance ( ) . p - > readClassName ( vtable ) ;
FAIL ( " vtable is not a known subclass (subclass is " < < class_name < < " ) " ) ;
2020-02-05 17:24:10 -07:00
return ;
}
2020-02-14 18:47:26 -07:00
auto vident = virtual_identity : : get ( reinterpret_cast < virtual_ptr > ( item . ptr ) ) ;
ToCheck virtual_item ( item , " < " + vident - > getFullName ( ) + " > " , item . ptr , vident ) ;
2020-02-12 16:57:55 -07:00
check_struct ( virtual_item ) ;
2020-02-05 17:24:10 -07:00
}