| #!/usr/bin/env python |
| |
| # |
| # Copyright 2012 the V8 project authors. All rights reserved. |
| # Redistribution and use in source and binary forms, with or without |
| # modification, are permitted provided that the following conditions are |
| # met: |
| # |
| # * Redistributions of source code must retain the above copyright |
| # notice, this list of conditions and the following disclaimer. |
| # * Redistributions in binary form must reproduce the above |
| # copyright notice, this list of conditions and the following |
| # disclaimer in the documentation and/or other materials provided |
| # with the distribution. |
| # * Neither the name of Google Inc. nor the names of its |
| # contributors may be used to endorse or promote products derived |
| # from this software without specific prior written permission. |
| # |
| # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| # |
| |
| # |
| # Emits a C++ file to be compiled and linked into libv8 to support postmortem |
| # debugging tools. Most importantly, this tool emits constants describing V8 |
| # internals: |
| # |
| # v8dbg_type_CLASS__TYPE = VALUE Describes class type values |
| # v8dbg_class_CLASS__FIELD__TYPE = OFFSET Describes class fields |
| # v8dbg_parent_CLASS__PARENT Describes class hierarchy |
| # v8dbg_frametype_NAME = VALUE Describes stack frame values |
| # v8dbg_off_fp_NAME = OFFSET Frame pointer offsets |
| # v8dbg_prop_NAME = OFFSET Object property offsets |
| # v8dbg_NAME = VALUE Miscellaneous values |
| # |
| # These constants are declared as global integers so that they'll be present in |
| # the generated libv8 binary. |
| # |
| |
| # for py2/py3 compatibility |
| from __future__ import print_function |
| |
| import io |
| import re |
| import sys |
| |
| # |
| # Miscellaneous constants such as tags and masks used for object identification, |
# enumeration values used as indexes in internal tables, etc.
| # |
# Each entry pairs the suffix of the emitted "v8dbg_<name>" symbol with the
# C++ expression whose value it takes.  The table is written as
# (name, value) pairs and expanded into the {'name': ..., 'value': ...}
# dictionaries that emit_set() consumes.
consts_misc = list(
    {'name': name, 'value': value}
    for name, value in (
        # Instance type boundaries.
        ('FirstNonstringType', 'FIRST_NONSTRING_TYPE'),
        ('APIObjectType', 'JS_API_OBJECT_TYPE'),
        ('SpecialAPIObjectType', 'JS_SPECIAL_API_OBJECT_TYPE'),

        ('FirstContextType', 'FIRST_CONTEXT_TYPE'),
        ('LastContextType', 'LAST_CONTEXT_TYPE'),

        # String tags and masks.
        ('IsNotStringMask', 'kIsNotStringMask'),
        ('StringTag', 'kStringTag'),

        ('StringEncodingMask', 'kStringEncodingMask'),
        ('TwoByteStringTag', 'kTwoByteStringTag'),
        ('OneByteStringTag', 'kOneByteStringTag'),

        ('StringRepresentationMask', 'kStringRepresentationMask'),
        ('SeqStringTag', 'kSeqStringTag'),
        ('ConsStringTag', 'kConsStringTag'),
        ('ExternalStringTag', 'kExternalStringTag'),
        ('SlicedStringTag', 'kSlicedStringTag'),
        ('ThinStringTag', 'kThinStringTag'),

        # Pointer tagging and sizes.
        ('HeapObjectTag', 'kHeapObjectTag'),
        ('HeapObjectTagMask', 'kHeapObjectTagMask'),
        ('SmiTag', 'kSmiTag'),
        ('SmiTagMask', 'kSmiTagMask'),
        ('SmiValueShift', 'kSmiTagSize'),
        ('SmiShiftSize', 'kSmiShiftSize'),
        ('SystemPointerSize', 'kSystemPointerSize'),
        ('SystemPointerSizeLog2', 'kSystemPointerSizeLog2'),
        ('TaggedSize', 'kTaggedSize'),
        ('TaggedSizeLog2', 'kTaggedSizeLog2'),

        # Oddball kinds.
        ('OddballFalse', 'Oddball::kFalse'),
        ('OddballTrue', 'Oddball::kTrue'),
        ('OddballTheHole', 'Oddball::kTheHole'),
        ('OddballNull', 'Oddball::kNull'),
        ('OddballArgumentsMarker', 'Oddball::kArgumentsMarker'),
        ('OddballUndefined', 'Oddball::kUndefined'),
        ('OddballUninitialized', 'Oddball::kUninitialized'),
        ('OddballOther', 'Oddball::kOther'),
        ('OddballException', 'Oddball::kException'),

        # Register codes.
        ('ContextRegister', 'kContextRegister.code()'),
        ('ReturnRegister0', 'kReturnRegister0.code()'),
        ('JSFunctionRegister', 'kJSFunctionRegister.code()'),
        ('InterpreterBytecodeOffsetRegister',
         'kInterpreterBytecodeOffsetRegister.code()'),
        ('InterpreterBytecodeArrayRegister',
         'kInterpreterBytecodeArrayRegister.code()'),
        ('RuntimeCallFunctionRegister',
         'kRuntimeCallFunctionRegister.code()'),

        # PropertyDetails layout.
        ('prop_kind_Data', 'kData'),
        ('prop_kind_Accessor', 'kAccessor'),
        ('prop_kind_mask', 'PropertyDetails::KindField::kMask'),
        ('prop_location_Descriptor', 'kDescriptor'),
        ('prop_location_Field', 'kField'),
        ('prop_location_mask', 'PropertyDetails::LocationField::kMask'),
        ('prop_location_shift', 'PropertyDetails::LocationField::kShift'),
        ('prop_attributes_NONE', 'NONE'),
        ('prop_attributes_READ_ONLY', 'READ_ONLY'),
        ('prop_attributes_DONT_ENUM', 'DONT_ENUM'),
        ('prop_attributes_DONT_DELETE', 'DONT_DELETE'),
        ('prop_attributes_mask', 'PropertyDetails::AttributesField::kMask'),
        ('prop_attributes_shift', 'PropertyDetails::AttributesField::kShift'),
        ('prop_index_mask', 'PropertyDetails::FieldIndexField::kMask'),
        ('prop_index_shift', 'PropertyDetails::FieldIndexField::kShift'),
        ('prop_representation_mask',
         'PropertyDetails::RepresentationField::kMask'),
        ('prop_representation_shift',
         'PropertyDetails::RepresentationField::kShift'),
        ('prop_representation_smi', 'Representation::Kind::kSmi'),
        ('prop_representation_double', 'Representation::Kind::kDouble'),
        ('prop_representation_heapobject',
         'Representation::Kind::kHeapObject'),
        ('prop_representation_tagged', 'Representation::Kind::kTagged'),

        # DescriptorArray entry layout.
        ('prop_desc_key', 'DescriptorArray::kEntryKeyIndex'),
        ('prop_desc_details', 'DescriptorArray::kEntryDetailsIndex'),
        ('prop_desc_value', 'DescriptorArray::kEntryValueIndex'),
        ('prop_desc_size', 'DescriptorArray::kEntrySize'),

        # Elements kinds.
        ('elements_fast_holey_elements', 'HOLEY_ELEMENTS'),
        ('elements_fast_elements', 'PACKED_ELEMENTS'),
        ('elements_dictionary_elements', 'DICTIONARY_ELEMENTS'),

        # Map bit fields.
        ('bit_field2_elements_kind_mask',
         'Map::Bits2::ElementsKindBits::kMask'),
        ('bit_field2_elements_kind_shift',
         'Map::Bits2::ElementsKindBits::kShift'),
        ('bit_field3_is_dictionary_map_shift',
         'Map::Bits3::IsDictionaryMapBit::kShift'),
        ('bit_field3_number_of_own_descriptors_mask',
         'Map::Bits3::NumberOfOwnDescriptorsBits::kMask'),
        ('bit_field3_number_of_own_descriptors_shift',
         'Map::Bits3::NumberOfOwnDescriptorsBits::kShift'),
        ('class_Map__instance_descriptors_offset',
         'Map::kInstanceDescriptorsOffset'),

        # Frame-pointer-relative offsets.
        ('off_fp_context_or_frame_type',
         'CommonFrameConstants::kContextOrFrameTypeOffset'),
        ('off_fp_context', 'StandardFrameConstants::kContextOffset'),
        ('off_fp_constant_pool',
         'StandardFrameConstants::kConstantPoolOffset'),
        ('off_fp_function', 'StandardFrameConstants::kFunctionOffset'),
        ('off_fp_args', 'StandardFrameConstants::kFixedFrameSizeAboveFp'),

        # ScopeInfo indexes.
        ('scopeinfo_idx_nparams', 'ScopeInfo::kParameterCount'),
        ('scopeinfo_idx_ncontextlocals', 'ScopeInfo::kContextLocalCount'),
        ('scopeinfo_idx_first_vars', 'ScopeInfo::kVariablePartIndex'),

        # JSArrayBuffer bits.
        ('jsarray_buffer_was_detached_mask',
         'JSArrayBuffer::WasDetachedBit::kMask'),
        ('jsarray_buffer_was_detached_shift',
         'JSArrayBuffer::WasDetachedBit::kShift'),

        # Context slots.
        ('context_idx_scope_info', 'Context::SCOPE_INFO_INDEX'),
        ('context_idx_prev', 'Context::PREVIOUS_INDEX'),
        ('context_min_slots', 'Context::MIN_CONTEXT_SLOTS'),
        ('native_context_embedder_data_offset',
         'Internals::kNativeContextEmbedderDataOffset'),

        # Dictionary shapes.
        ('namedictionaryshape_prefix_size',
         'NameDictionaryShape::kPrefixSize'),
        ('namedictionaryshape_entry_size',
         'NameDictionaryShape::kEntrySize'),
        ('globaldictionaryshape_entry_size',
         'GlobalDictionaryShape::kEntrySize'),

        ('namedictionary_prefix_start_index',
         'NameDictionary::kPrefixStartIndex'),

        ('numberdictionaryshape_prefix_size',
         'NumberDictionaryShape::kPrefixSize'),
        ('numberdictionaryshape_entry_size',
         'NumberDictionaryShape::kEntrySize'),

        ('simplenumberdictionaryshape_prefix_size',
         'SimpleNumberDictionaryShape::kPrefixSize'),
        ('simplenumberdictionaryshape_entry_size',
         'SimpleNumberDictionaryShape::kEntrySize'),

        ('type_JSError__JS_ERROR_TYPE', 'JS_ERROR_TYPE'),
    )
)
| |
| # |
| # The following useful fields are missing accessors, so we define fake ones. |
| # Please note that extra accessors should _only_ be added to expose offsets that |
| # can be used to access actual V8 objects' properties. They should not be added |
| # for exposing other values. For instance, enumeration values or class' |
| # constants should be exposed by adding an entry in the "consts_misc" table, not |
| # in this "extras_accessors" table. |
| # |
# Each entry is the argument list of a synthetic ACCESSORS(...) macro call, in
# the form "Class, field, type, offset-constant".  load_fields() wraps every
# entry as 'ACCESSORS(<entry>)' and hands it to parse_field().
extras_accessors = [
    # Functions, generic objects and arrays.
    "JSFunction, context, Context, kContextOffset",
    "JSFunction, shared, SharedFunctionInfo, kSharedFunctionInfoOffset",
    "HeapObject, map, Map, kMapOffset",
    "JSObject, elements, Object, kElementsOffset",
    "JSObject, internal_fields, uintptr_t, kHeaderSize",
    "FixedArray, data, uintptr_t, kHeaderSize",
    # Array buffers, views and other JS wrappers.
    "JSArrayBuffer, backing_store, uintptr_t, kBackingStoreOffset",
    "JSArrayBuffer, byte_length, size_t, kByteLengthOffset",
    "JSArrayBufferView, byte_length, size_t, kByteLengthOffset",
    "JSArrayBufferView, byte_offset, size_t, kByteOffsetOffset",
    "JSDate, value, Object, kValueOffset",
    "JSRegExp, source, Object, kSourceOffset",
    "JSTypedArray, external_pointer, uintptr_t, kExternalPointerOffset",
    "JSTypedArray, length, Object, kLengthOffset",
    # Map.
    "Map, instance_size_in_words, char, kInstanceSizeInWordsOffset",
    "Map, inobject_properties_start_or_constructor_function_index, char, kInObjectPropertiesStartOrConstructorFunctionIndexOffset",
    "Map, instance_type, uint16_t, kInstanceTypeOffset",
    "Map, bit_field, char, kBitFieldOffset",
    "Map, bit_field2, char, kBitField2Offset",
    "Map, bit_field3, int, kBitField3Offset",
    "Map, prototype, Object, kPrototypeOffset",
    # Primitives and strings.
    "Oddball, kind_offset, int, kKindOffset",
    "HeapNumber, value, double, kValueOffset",
    "ExternalString, resource, Object, kResourceOffset",
    "SeqOneByteString, chars, char, kHeaderSize",
    "SeqTwoByteString, chars, char, kHeaderSize",
    # Function metadata and code.
    "UncompiledData, inferred_name, String, kInferredNameOffset",
    "UncompiledData, start_position, int32_t, kStartPositionOffset",
    "UncompiledData, end_position, int32_t, kEndPositionOffset",
    "SharedFunctionInfo, raw_function_token_offset, int16_t, kFunctionTokenOffsetOffset",
    "SharedFunctionInfo, internal_formal_parameter_count, uint16_t, kFormalParameterCountOffset",
    "SharedFunctionInfo, flags, int, kFlagsOffset",
    "SharedFunctionInfo, length, uint16_t, kLengthOffset",
    "SlicedString, parent, String, kParentOffset",
    "Code, instruction_start, uintptr_t, kHeaderSize",
    "Code, instruction_size, int, kInstructionSizeOffset",
    # Remaining string shapes, descriptors and symbols.
    "String, length, int32_t, kLengthOffset",
    "DescriptorArray, header_size, uintptr_t, kHeaderSize",
    "ConsString, first, String, kFirstOffset",
    "ConsString, second, String, kSecondOffset",
    "SlicedString, offset, SMI, kOffsetOffset",
    "ThinString, actual, String, kActualOffset",
    "Symbol, name, Object, kDescriptionOffset",
]
| |
| # |
| # The following is a whitelist of classes we expect to find when scanning the |
| # source code. This list is not exhaustive, but it's still useful to identify |
| # when this script gets out of sync with the source. See load_objects(). |
| # |
# Classes that load_objects() requires to be matched to an instance type;
# any that remain unmatched after scanning are reported as errors.
expected_classes = [
    "ConsString",
    "FixedArray",
    "HeapNumber",
    "JSArray",
    "JSFunction",
    "JSObject",
    "JSRegExp",
    "JSPrimitiveWrapper",
    "Map",
    "Oddball",
    "Script",
    "SeqOneByteString",
    "SharedFunctionInfo",
    "ScopeInfo",
    "JSPromise",
    "DescriptorArray",
]
| |
| |
| # |
| # The following structures store high-level representations of the structures |
| # for which we're going to emit descriptive constants. |
| # |
# Module-level state, populated while the input headers are scanned.
types = dict()        # set of all type names (keys only; values are True)
typeclasses = dict()  # maps type names to corresponding class names
klasses = dict()      # known classes, including parents
fields = list()       # field declarations
| |
# Text written at the top of the generated C++ file.  The single %s is
# replaced with this script's name (sys.argv[0]).  The FRAME_CONST macro
# definition is emitted on one line.
header = (
    '\n'
    '/*\n'
    '* This file is generated by %s. Do not edit directly.\n'
    '*/\n'
    '\n'
    '#include "src/init/v8.h"\n'
    '#include "src/codegen/register-arch.h"\n'
    '#include "src/execution/frames.h"\n'
    '#include "src/execution/frames-inl.h"'
    ' /* for architecture-specific frame constants */\n'
    '#include "src/objects/contexts.h"\n'
    '#include "src/objects/objects.h"\n'
    '#include "src/objects/data-handler.h"\n'
    '#include "src/objects/js-promise.h"\n'
    '#include "src/objects/js-regexp-string-iterator.h"\n'
    '\n'
    'namespace v8 {\n'
    'namespace internal {\n'
    '\n'
    'extern "C" {\n'
    '\n'
    '/* stack frame constants */\n'
    '#define FRAME_CONST(value, klass) '
    'V8_EXPORT int v8dbg_frametype_##klass = StackFrame::value;\n'
    '\n'
    'STACK_FRAME_TYPE_LIST(FRAME_CONST)\n'
    '\n'
    '#undef FRAME_CONST\n'
    '\n'
) % (sys.argv[0],)
| |
# Text written at the end of the generated C++ file: one closing brace for
# the extern "C" block, then one for each of the two namespaces opened in the
# header.
footer = '\n}\n\n}\n}\n'
| |
| # |
| # Get the base class |
| # |
def get_base_class(klass):
    """Follow 'parent' links in the global klasses table starting at klass.

    Returns 'Object' when the chain reaches the class named 'Object', and
    None when it reaches a name that has no entry in klasses (including a
    parent of None).
    """
    if klass != 'Object':
        entry = klasses.get(klass)
        if entry is None:
            return None
        return get_base_class(entry['parent'])

    return klass
| |
| # |
| # Loads class hierarchy and type information from "objects.h" etc. |
| # |
def load_objects():
    """Scan every non "-inl.h" input header for classes and instance types.

    The inputs are the command-line arguments from sys.argv[2] onwards.  Each
    scan removes from the pending table the expected classes it managed to
    match; if any are left once all files are processed, an error line is
    printed for each and the script exits with status 1.
    """
    # One pending entry per class we are sure should be present.
    checktypes = dict.fromkeys(expected_classes, True)

    headers = [path for path in sys.argv[2:] if not path.endswith("-inl.h")]
    for path in headers:
        load_objects_from_file(path, checktypes)

    if not checktypes:
        return

    for missing in checktypes:
        print('error: expected class \"%s\" not found' % missing)

    sys.exit(1)
| |
| |
def load_objects_from_file(objfilename, checktypes):
    """Collect class and instance-type information from one header file.

    Updates the module-level tables:
      * klasses     - one entry per "class X [: public Y] {" declaration,
                      mapping X to {'parent': Y} (parent is None when no
                      base class was matched).
      * types       - every instance type name found in the InstanceType
                      enum or in the Torque instance-type macros.
      * typeclasses - instance type name -> class name, either taken from
                      the Torque "fully defined" macro or inferred from the
                      type name.

    Args:
      objfilename: path of the header to scan (read as UTF-8).
      checktypes: dict of class names still waiting to be matched; every
          class that gets associated with a type is deleted from it.
    """
    in_insttype = False
    in_torque_insttype = False
    in_torque_fulldef = False

    typestr = ''
    torque_typestr = ''
    torque_fulldefstr = ''
    uncommented_file = ''

    #
    # Iterate the header file line-by-line to collect type and class
    # information. For types, we accumulate a string representing the entire
    # InstanceType enum definition and parse it later because it's easier to
    # do so without the embedded newlines.
    #
    # The "with" block guarantees the file is closed even if parsing raises.
    #
    with io.open(objfilename, 'r', encoding='utf-8') as objfile:
        for line in objfile:
            if line.startswith('enum InstanceType : uint16_t {'):
                in_insttype = True
                continue

            if line.startswith('#define TORQUE_ASSIGNED_INSTANCE_TYPE_LIST'):
                in_torque_insttype = True
                continue

            if line.startswith(
                    '#define TORQUE_INSTANCE_CHECKERS_SINGLE_FULLY_DEFINED'):
                in_torque_fulldef = True
                continue

            if in_insttype and line.startswith('};'):
                in_insttype = False
                continue

            # A blank line terminates either Torque macro body.
            if in_torque_insttype and (not line or line.isspace()):
                in_torque_insttype = False
                continue

            if in_torque_fulldef and (not line or line.isspace()):
                in_torque_fulldef = False
                continue

            # Drop surrounding whitespace and any trailing "//" comment.
            line = re.sub(r'//.*', '', line.strip())

            if in_insttype:
                typestr += line
                continue

            if in_torque_insttype:
                torque_typestr += line
                continue

            if in_torque_fulldef:
                torque_fulldefstr += line
                continue

            uncommented_file += '\n' + line

    for class_match in re.finditer(r'\nclass(?:\s+V8_EXPORT(?:_PRIVATE)?)?'
                                   r'\s+(\w[^:;]*)'
                                   r'(?:: public (\w[^{]*))?\s*{\s*',
                                   uncommented_file):
        klass = class_match.group(1).strip()
        pklass = class_match.group(2)
        if pklass:
            # Check for generated Torque class.
            gen_match = re.match(
                r'TorqueGenerated\w+\s*<\s*\w+,\s*(\w+)\s*>',
                pklass)
            if gen_match:
                pklass = gen_match.group(1)
            # Strip potential template arguments from parent
            # class.
            parent_match = re.match(r'(\w+)(<.*>)?', pklass.strip())
            pklass = parent_match.group(1).strip()
        klasses[klass] = {'parent': pklass}

    #
    # Process the instance type declaration.
    #
    for entry in typestr.split(','):
        types[re.sub(r'\s*=.*', '', entry).lstrip()] = True
    for entry in torque_typestr.split('\\'):
        types[re.sub(r' *V\(|\) *', '', entry)] = True
    for entry in torque_fulldefstr.split('\\'):
        entry = entry.strip()
        if not entry:
            continue
        # Entries look like "V(ClassName, TYPE_CONSTANT)".
        idx = entry.find('(')
        rest = entry[idx + 1: len(entry) - 1]
        args = re.split(r'\s*,\s*', rest)
        typename = args[0]
        typeconst = args[1]
        types[typeconst] = True
        typeclasses[typeconst] = typename

    #
    # Infer class names for each type based on a systematic transformation.
    # For example, "JS_FUNCTION_TYPE" becomes "JSFunction".  We find the
    # class for each type rather than the other way around because there are
    # fewer cases where one type maps to more than one class than the other
    # way around.
    #
    for insttype in types:
        #
        # Remove the "_TYPE" suffix and then convert to camel case,
        # except that a "JS" prefix remains uppercase (as in
        # "JS_FUNCTION_TYPE" => "JSFunction").
        #
        if not insttype.endswith('_TYPE'):
            continue

        parts = insttype[0:len(insttype) - len('_TYPE')].split('_')

        if parts[0] == 'JS':
            cctype = 'JS'
            start = 1
        else:
            cctype = ''
            start = 0

        for part in parts[start:]:
            # part[:1] (rather than part[0]) tolerates an empty component,
            # e.g. one produced by a doubled underscore.
            cctype += part[:1].upper() + part[1:].lower()

        #
        # Mapping string types is more complicated.  Both types and
        # class names for Strings specify a representation (e.g., Seq,
        # Cons, External, or Sliced) and an encoding (TwoByte/OneByte),
        # In the simplest case, both of these are explicit in both
        # names, as in:
        #
        #       EXTERNAL_ONE_BYTE_STRING_TYPE => ExternalOneByteString
        #
        # However, either the representation or encoding can be omitted
        # from the type name, in which case "Seq" and "TwoByte" are
        # assumed, as in:
        #
        #       STRING_TYPE => SeqTwoByteString
        #
        # Additionally, sometimes the type name has more information
        # than the class, as in:
        #
        #       CONS_ONE_BYTE_STRING_TYPE => ConsString
        #
        # To figure this out dynamically, we first check for a
        # representation and encoding and add them if they're not
        # present.  If that doesn't yield a valid class name, then we
        # strip out the representation.
        #
        if cctype.endswith('String'):
            if (cctype.find('Cons') == -1 and
                    cctype.find('External') == -1 and
                    cctype.find('Sliced') == -1):
                if cctype.find('OneByte') != -1:
                    cctype = re.sub(r'OneByteString$',
                                    'SeqOneByteString', cctype)
                else:
                    cctype = re.sub(r'String$', 'SeqString', cctype)

            if cctype.find('OneByte') == -1:
                cctype = re.sub(r'String$', 'TwoByteString', cctype)

            if cctype not in klasses:
                cctype = re.sub('OneByte', '', cctype)
                cctype = re.sub('TwoByte', '', cctype)

        #
        # Despite all that, some types have no corresponding class.
        #
        if cctype in klasses:
            typeclasses[insttype] = cctype
            if cctype in checktypes:
                del checktypes[cctype]
| |
| # |
| # For a given macro call, pick apart the arguments and return an object |
| # describing the corresponding output constant. See load_fields(). |
| # |
def parse_field(call):
    """Turn one accessor macro invocation into an output constant.

    Args:
      call: the text of a macro call such as
          'ACCESSORS(Class, field, Type, kOffset)'.  The text before the
          first '(' selects how the arguments are interpreted:
            * WEAK_ACCESSORS...                  (class, field, offset)
            * SMI_ACCESSORS... / ACCESSORS_TO_SMI... (class, field, offset)
            * anything else                      (class, field, type, offset)

    Returns:
      A dict with 'name' ('class_<class>__<field>__<type>') and 'value'
      ('<class>::<offset>').  The type is 'weak' or 'SMI' for the two
      three-argument forms; otherwise it is the macro's type argument with
      '<' and '>' replaced by '_'.

    Raises:
      IndexError: if the call has fewer arguments than its kind requires.
    """
    # Replace newlines with spaces.  (Strings are immutable, so this has to
    # build a new string rather than assign to individual characters.)
    call = call.replace('\n', ' ')

    idx = call.find('(')
    kind = call[0:idx]
    # Everything between the first '(' and the final character of the call.
    rest = call[idx + 1: len(call) - 1]
    args = re.split(r'\s*,\s*', rest)

    klass = args[0]
    field = args[1]
    if kind.startswith('WEAK_ACCESSORS'):
        dtype = 'weak'
        offset = args[2]
    elif kind.startswith(('SMI_ACCESSORS', 'ACCESSORS_TO_SMI')):
        dtype = 'SMI'
        offset = args[2]
    else:
        dtype = args[2].replace('<', '_').replace('>', '_')
        offset = args[3]

    return {
        'name': 'class_%s__%s__%s' % (klass, field, dtype),
        'value': '%s::%s' % (klass, offset)
    }
| |
| # |
| # Load field offset information from objects-inl.h etc. |
| # |
def load_fields():
    """Populate the global fields list.

    First scans every "-inl.h" file named on the command line (sys.argv[2]
    onwards), then appends one parsed entry for each line of
    extras_accessors, wrapped as an ACCESSORS(...) call.
    """
    inl_headers = [path for path in sys.argv[2:] if path.endswith("-inl.h")]
    for path in inl_headers:
        load_fields_from_file(path)

    for accessor_args in extras_accessors:
        synthetic_call = 'ACCESSORS(%s)' % accessor_args
        fields.append(parse_field(synthetic_call))
| |
| |
def _scan_parens(line, start, opens):
    """Walk line[start:] updating the open-parenthesis count.

    Scanning stops right after the character that brings the count to zero,
    or at the end of the line.  Returns (end, opens) where line[:end] is the
    text consumed so far and opens is the updated count.
    """
    end = start
    for end in range(start, len(line)):
        if line[end] == '(':
            opens += 1
        elif line[end] == ')':
            opens -= 1

        if opens == 0:
            break

    return end + 1, opens


def load_fields_from_file(filename):
    """Extract accessor macro invocations from one "-inl.h" style file.

    Every invocation found is passed to parse_field() and the result is
    appended to the global fields list.

    Args:
      filename: path of the file to scan (read as UTF-8).
    """
    #
    # Each class's fields and the corresponding offsets are described in the
    # source by calls to macros like "ACCESSORS" (and friends).  All we do
    # here is extract these macro invocations, taking into account that they
    # may span multiple lines and may contain nested parentheses.  We also
    # call parse_field() to pick apart the invocation.
    #
    prefixes = ['ACCESSORS', 'ACCESSORS2', 'ACCESSORS_GCSAFE',
                'SMI_ACCESSORS', 'ACCESSORS_TO_SMI',
                'RELEASE_ACQUIRE_ACCESSORS', 'WEAK_ACCESSORS']
    prefixes += ([prefix + "_CHECKED" for prefix in prefixes] +
                 [prefix + "_CHECKED2" for prefix in prefixes])
    current = ''
    opens = 0

    # The "with" block guarantees the file is closed even if parsing raises.
    with io.open(filename, 'r', encoding='utf-8') as inlfile:
        for line in inlfile:
            if opens > 0:
                # Continuation line of an invocation that is still open.
                end, opens = _scan_parens(line, 0, opens)
                current += line[:end]
                continue

            for prefix in prefixes:
                if not line.startswith(prefix + '('):
                    continue

                # A new invocation starts here; flush the previous one.
                if current:
                    fields.append(parse_field(current))
                    current = ''

                end, opens = _scan_parens(line, len(prefix), opens)
                current += line[:end]
                # Prefixes are distinct and each is matched together with
                # its '(' so no other prefix can match this line.
                break

    if current:
        fields.append(parse_field(current))
| |
| # |
| # Emit a block of constants. |
| # |
def emit_set(out, consts):
    """Write one block of "V8_EXPORT int v8dbg_<name> = <value>;" lines.

    Args:
      out: object with a write() method that receives the text.
      consts: iterable of dicts with 'name' and 'value' entries; 'value' may
          be a string or a number.

    Duplicate lines are written once.  Lines are written in sorted order so
    that the generated file is identical from run to run; the block is
    followed by a blank line.
    """
    lines = set()  # To remove duplicates.

    # Fix up overzealous parses.  This could be done inside the
    # parsers but as there are several, it's easiest to do it here.
    ws = re.compile(r'\s+')
    for const in consts:
        name = ws.sub('', const['name'])
        value = ws.sub('', str(const['value']))  # Can be a number.
        lines.add('V8_EXPORT int v8dbg_%s = %s;\n' % (name, value))

    # Set iteration order depends on string hashing; sort for stable output.
    for line in sorted(lines):
        out.write(line)
    out.write('\n')
| |
| # |
| # Emit the whole output file. |
| # |
def emit_config():
    """Write the complete generated file to the path given in sys.argv[1].

    The output consists of the header, then four blocks produced with
    emit_set() - miscellaneous constants, class type information, class
    hierarchy information and field information - and finally the footer.
    """
    # The "with" block makes sure the output is flushed and closed, even if
    # one of the emit steps raises.
    with open(sys.argv[1], 'w') as out:
        out.write(header)

        out.write('/* miscellaneous constants */\n')
        emit_set(out, consts_misc)

        out.write('/* class type information */\n')
        consts = []
        for typename in sorted(typeclasses):
            klass = typeclasses[typename]
            consts.append({
                'name': 'type_%s__%s' % (klass, typename),
                'value': typename
            })

        emit_set(out, consts)

        out.write('/* class hierarchy information */\n')
        consts = []
        for klassname in sorted(klasses):
            pklass = klasses[klassname]['parent']
            # Only classes whose ancestry leads to 'Object' are reported,
            # and only when they have a recorded parent.
            if get_base_class(klassname) != 'Object':
                continue
            if pklass is None:
                continue

            consts.append({
                'name': 'parent_%s__%s' % (klassname, pklass),
                'value': 0
            })

        emit_set(out, consts)

        out.write('/* field information */\n')
        emit_set(out, fields)

        out.write(footer)
| |
# Script entry: requires an output path plus at least two input headers,
# then runs the three phases in order (scan classes/types, scan fields,
# write the output file).
if not len(sys.argv) >= 4:
    print('usage: %s output.cc objects.h objects-inl.h' % sys.argv[0])
    sys.exit(2)

load_objects()
load_fields()
emit_config()