/*************************************************************************** Interface between g++ and Boehm GC Copyright (c) 1991-1995 by Xerox Corporation. All rights reserved. THIS MATERIAL IS PROVIDED AS IS, WITH ABSOLUTELY NO WARRANTY EXPRESSED OR IMPLIED. ANY USE IS AT YOUR OWN RISK. Permission is hereby granted to copy this code for any purpose, provided the above notices are retained on all copies. Last modified on Sun Jul 16 23:21:14 PDT 1995 by ellis This module provides runtime support for implementing the Ellis/Detlefs GC proposal, "Safe, Efficient Garbage Collection for C++", within g++, using its -fgc-keyword extension. It defines versions of __builtin_new, __builtin_new_gc, __builtin_vec_new, __builtin_vec_new_gc, __builtin_delete, and __builtin_vec_delete that invoke the Bohem GC. It also implements the WeakPointer.h interface. This module assumes the following configuration options of the Boehm GC: -DALL_INTERIOR_POINTERS -DDONT_ADD_BYTE_AT_END This module adds its own required padding to the end of objects to support C/C++ "one-past-the-object" pointer semantics. ****************************************************************************/ #include #include "gc.h" #if defined(__STDC__) # define PROTO( args ) args #else # define PROTO( args ) () # endif #define BITSPERBYTE 8 /* What's the portable way to do this? */ typedef void (*vfp) PROTO(( void )); extern vfp __new_handler; extern void __default_new_handler PROTO(( void )); /* A destructor_proc is the compiler generated procedure representing a C++ destructor. The "flag" argument is a hidden argument following some compiler convention. */ typedef (*destructor_proc) PROTO(( void* this, int flag )); /*************************************************************************** A BI_header is the header the compiler adds to the front of new-allocated arrays of objects with destructors. The header is padded out to a double, because that's what the compiler does to ensure proper alignment of array elements on some architectures. int NUM_ARRAY_ELEMENTS (void* o) returns the number of array elements for array object o. char* FIRST_ELEMENT_P (void* o) returns the address of the first element of array object o. ***************************************************************************/ typedef struct BI_header { int nelts; char padding [sizeof( double ) - sizeof( int )]; /* Better way to do this? */ } BI_header; #define NUM_ARRAY_ELEMENTS( o ) \ (((BI_header*) o)->nelts) #define FIRST_ELEMENT_P( o ) \ ((char*) o + sizeof( BI_header )) /*************************************************************************** The __builtin_new routines add a descriptor word to the end of each object. The descriptor serves two purposes. First, the descriptor acts as padding, implementing C/C++ pointer semantics. C and C++ allow a valid array pointer to be incremented one past the end of an object. The extra padding ensures that the collector will recognize that such a pointer points to the object and not the next object in memory. Second, the descriptor stores three extra pieces of information, whether an object has a registered finalizer (destructor), whether it may have any weak pointers referencing it, and for collectible arrays, the element size of the array. The element size is required for the array's finalizer to iterate through the elements of the array. (An alternative design would have the compiler generate a finalizer procedure for each different array type. But given the overhead of finalization, there isn't any efficiency to be gained by that.) The descriptor must be added to non-collectible as well as collectible objects, since the Ellis/Detlefs proposal allows "pointer to gc T" to be assigned to a "pointer to T", which could then be deleted. Thus, __builtin_delete must determine at runtime whether an object is collectible, whether it has weak pointers referencing it, and whether it may have a finalizer that needs unregistering. Though GC_REGISTER_FINALIZER doesn't care if you ask it to unregister a finalizer for an object that doesn't have one, it is a non-trivial procedure that does a hash look-up, etc. The descriptor trades a little extra space for a significant increase in time on the fast path through delete. (A similar argument applies to GC_UNREGISTER_DISAPPEARING_LINK). For non-array types, the space for the descriptor could be shrunk to a single byte for storing the "has finalizer" flag. But this would save space only on arrays of char (whose size is not a multiple of the word size) and structs whose largest member is less than a word in size (very infrequent). And it would require that programmers actually remember to call "delete[]" instead of "delete" (which they should, but there are probably lots of buggy programs out there). For the moment, the space savings seems not worthwhile, especially considering that the Boehm GC is already quite space competitive with other malloc's. Given a pointer o to the base of an object: Descriptor* DESCRIPTOR (void* o) returns a pointer to the descriptor for o. The implementation of descriptors relies on the fact that the GC implementation allocates objects in units of the machine's natural word size (e.g. 32 bits on a SPARC, 64 bits on an Alpha). **************************************************************************/ typedef struct Descriptor { unsigned has_weak_pointers: 1; unsigned has_finalizer: 1; unsigned element_size: BITSPERBYTE * sizeof( unsigned ) - 2; } Descriptor; #define DESCRIPTOR( o ) \ ((Descriptor*) ((char*)(o) + GC_size( o ) - sizeof( Descriptor ))) /************************************************************************** Implementations of global operator new() and operator delete() ***************************************************************************/ void* __builtin_new( size ) size_t size; /* For non-gc non-array types, the compiler generates calls to __builtin_new, which allocates non-collected storage via GC_MALLOC_UNCOLLECTABLE. This ensures that the non-collected storage will be part of the collector's root set, required by the Ellis/Detlefs semantics. */ { vfp handler = __new_handler ? __new_handler : __default_new_handler; while (1) { void* o = GC_MALLOC_UNCOLLECTABLE( size + sizeof( Descriptor ) ); if (o != 0) return o; (*handler) ();}} void* __builtin_vec_new( size ) size_t size; /* For non-gc array types, the compiler generates calls to __builtin_vec_new. */ { return __builtin_new( size );} void* __builtin_new_gc( size ) size_t size; /* For gc non-array types, the compiler generates calls to __builtin_new_gc, which allocates collected storage via GC_MALLOC. */ { vfp handler = __new_handler ? __new_handler : __default_new_handler; while (1) { void* o = GC_MALLOC( size + sizeof( Descriptor ) ); if (o != 0) return o; (*handler) ();}} void* __builtin_new_gc_a( size ) size_t size; /* For non-pointer-containing gc non-array types, the compiler generates calls to __builtin_new_gc_a, which allocates collected storage via GC_MALLOC_ATOMIC. */ { vfp handler = __new_handler ? __new_handler : __default_new_handler; while (1) { void* o = GC_MALLOC_ATOMIC( size + sizeof( Descriptor ) ); if (o != 0) return o; (*handler) ();}} void* __builtin_vec_new_gc( size ) size_t size; /* For gc array types, the compiler generates calls to __builtin_vec_new_gc. */ { return __builtin_new_gc( size );} void* __builtin_vec_new_gc_a( size ) size_t size; /* For non-pointer-containing gc array types, the compiler generates calls to __builtin_vec_new_gc_a. */ { return __builtin_new_gc_a( size );} static void call_destructor( o, data ) void* o; void* data; /* call_destructor is the GC finalizer proc registered for non-array gc objects with destructors. Its client data is the destructor proc, which it calls with the magic integer 2, a special flag obeying the compiler convention for destructors. */ { ((destructor_proc) data)( o, 2 );} void* __builtin_new_gc_dtor( o, d ) void* o; destructor_proc d; /* The compiler generates a call to __builtin_new_gc_dtor to register the destructor "d" of a non-array gc object "o" as a GC finalizer. The destructor is registered via GC_REGISTER_FINALIZER_IGNORE_SELF, which causes the collector to ignore pointers from the object to itself when determining when the object can be finalized. This is necessary due to the self pointers used in the internal representation of multiply-inherited objects. */ { Descriptor* desc = DESCRIPTOR( o ); GC_REGISTER_FINALIZER_IGNORE_SELF( o, call_destructor, d, 0, 0 ); desc->has_finalizer = 1;} static void call_array_destructor( o, data ) void* o; void* data; /* call_array_destructor is the GC finalizer proc registered for gc array objects whose elements have destructors. Its client data is the destructor proc. It iterates through the elements of the array in reverse order, calling the destructor on each. */ { int num = NUM_ARRAY_ELEMENTS( o ); Descriptor* desc = DESCRIPTOR( o ); size_t size = desc->element_size; char* first_p = FIRST_ELEMENT_P( o ); char* p = first_p + (num - 1) * size; if (num > 0) { while (1) { ((destructor_proc) data)( p, 2 ); if (p == first_p) break; p -= size;}}} void* __builtin_vec_new_gc_dtor( first_elem, d, element_size ) void* first_elem; destructor_proc d; size_t element_size; /* The compiler generates a call to __builtin_vec_new_gc_dtor to register the destructor "d" of a gc array object as a GC finalizer. "first_elem" points to the first element of the array, *not* the beginning of the object (this makes the generated call to this function smaller). The elements of the array are of size "element_size". The destructor is registered as in _builtin_new_gc_dtor. */ { void* o = (char*) first_elem - sizeof( BI_header ); Descriptor* desc = DESCRIPTOR( o ); GC_REGISTER_FINALIZER_IGNORE_SELF( o, call_array_destructor, d, 0, 0 ); desc->element_size = element_size; desc->has_finalizer = 1;} void __builtin_delete( o ) void* o; /* The compiler generates calls to __builtin_delete for operator delete(). The GC currently requires that any registered finalizers be unregistered before explicitly freeing an object. If the object has any weak pointers referencing it, we can't actually free it now. */ { if (o != 0) { Descriptor* desc = DESCRIPTOR( o ); if (desc->has_finalizer) GC_REGISTER_FINALIZER( o, 0, 0, 0, 0 ); if (! desc->has_weak_pointers) GC_FREE( o );}} void __builtin_vec_delete( o ) void* o; /* The compiler generates calls to __builitn_vec_delete for operator delete[](). */ { __builtin_delete( o );} /************************************************************************** Implementations of the template class WeakPointer from WeakPointer.h ***************************************************************************/ typedef struct WeakPointer { void* pointer; } WeakPointer; void* _WeakPointer_New( t ) void* t; { if (t == 0) { return 0;} else { void* base = GC_base( t ); WeakPointer* wp = (WeakPointer*) GC_MALLOC_ATOMIC( sizeof( WeakPointer ) ); Descriptor* desc = DESCRIPTOR( base ); wp->pointer = t; desc->has_weak_pointers = 1; GC_general_register_disappearing_link( &wp->pointer, base ); return wp;}} static void* PointerWithLock( wp ) WeakPointer* wp; { if (wp == 0 || wp->pointer == 0) { return 0;} else { return (void*) wp->pointer;}} void* _WeakPointer_Pointer( wp ) WeakPointer* wp; { return (void*) GC_call_with_alloc_lock( PointerWithLock, wp );} typedef struct EqualClosure { WeakPointer* wp1; WeakPointer* wp2; } EqualClosure; static void* EqualWithLock( ec ) EqualClosure* ec; { if (ec->wp1 == 0 || ec->wp2 == 0) { return (void*) (ec->wp1 == ec->wp2);} else { return (void*) (ec->wp1->pointer == ec->wp2->pointer);}} int _WeakPointer_Equal( wp1, wp2 ) WeakPointer* wp1; WeakPointer* wp2; { EqualClosure ec; ec.wp1 = wp1; ec.wp2 = wp2; return (int) GC_call_with_alloc_lock( EqualWithLock, &ec );} int _WeakPointer_Hash( wp ) WeakPointer* wp; { return (int) _WeakPointer_Pointer( wp );} /************************************************************************** Implementations of the template class CleanUp from WeakPointer.h ***************************************************************************/ typedef struct Closure { void (*c) PROTO(( void* d, void* t )); ptrdiff_t t_offset; void* d; } Closure; static void _CleanUp_CallClosure( obj, data ) void* obj; void* data; { Closure* closure = (Closure*) data; closure->c( closure->d, (char*) obj + closure->t_offset );} void _CleanUp_Set( t, c, d ) void* t; void (*c) PROTO(( void* d, void* t )); void* d; { void* base = GC_base( t ); Descriptor* desc = DESCRIPTOR( t ); if (c == 0) { GC_REGISTER_FINALIZER_IGNORE_SELF( base, 0, 0, 0, 0 ); desc->has_finalizer = 0;} else { Closure* closure = (Closure*) GC_MALLOC( sizeof( Closure ) ); closure->c = c; closure->t_offset = (char*) t - (char*) base; closure->d = d; GC_REGISTER_FINALIZER_IGNORE_SELF( base, _CleanUp_CallClosure, closure, 0, 0 ); desc->has_finalizer = 1;}} void _CleanUp_Call( t ) void* t; { /* ? Aren't we supposed to deactivate weak pointers to t too? Why? */ void* base = GC_base( t ); void* d; GC_finalization_proc f; GC_REGISTER_FINALIZER( base, 0, 0, &f, &d ); f( base, d );} typedef struct QueueElem { void* o; GC_finalization_proc f; void* d; struct QueueElem* next; } QueueElem; void* _CleanUp_Queue_NewHead() { return GC_MALLOC( sizeof( QueueElem ) );} static void _CleanUp_Queue_Enqueue( obj, data ) void* obj; void* data; { QueueElem* q = (QueueElem*) data; QueueElem* head = q->next; q->o = obj; q->next = head->next; head->next = q;} void _CleanUp_Queue_Set( h, t ) void* h; void* t; { QueueElem* head = (QueueElem*) h; void* base = GC_base( t ); void* d; GC_finalization_proc f; QueueElem* q = (QueueElem*) GC_MALLOC( sizeof( QueueElem ) ); GC_REGISTER_FINALIZER( base, _CleanUp_Queue_Enqueue, q, &f, &d ); q->f = f; q->d = d; q->next = head;} int _CleanUp_Queue_Call( h ) void* h; { QueueElem* head = (QueueElem*) h; QueueElem* q = head->next; if (q == 0) { return 0;} else { head->next = q->next; q->next = 0; if (q->f != 0) q->f( q->o, q->d ); return 1;}}