CoCalc -- compactHashtable.cpp

GitHub Repository: PojavLauncherTeam/mobile
Path: blob/master/src/hotspot/share/classfile/compactHashtable.cpp
40949 views
1
/*
2
 * Copyright (c) 1997, 2021, Oracle and/or its affiliates. All rights reserved.
3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4
 *
5
 * This code is free software; you can redistribute it and/or modify it
6
 * under the terms of the GNU General Public License version 2 only, as
7
 * published by the Free Software Foundation.
8
 *
9
 * This code is distributed in the hope that it will be useful, but WITHOUT
10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12
 * version 2 for more details (a copy is included in the LICENSE file that
13
 * accompanied this code).
14
 *
15
 * You should have received a copy of the GNU General Public License version
16
 * 2 along with this work; if not, write to the Free Software Foundation,
17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18
 *
19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20
 * or visit www.oracle.com if you need additional information or have any
21
 * questions.
22
 *
23
 */
24

25
#include "precompiled.hpp"
26
#include "jvm.h"
27
#include "cds/archiveBuilder.hpp"
28
#include "cds/heapShared.inline.hpp"
29
#include "classfile/compactHashtable.hpp"
30
#include "classfile/javaClasses.hpp"
31
#include "logging/logMessage.hpp"
32
#include "memory/metadataFactory.hpp"
33
#include "runtime/arguments.hpp"
34
#include "runtime/globals.hpp"
35
#include "runtime/vmThread.hpp"
36
#include "utilities/numberSeq.hpp"
37
#include <sys/stat.h>
38

39
#if INCLUDE_CDS
40
/////////////////////////////////////////////////////
41
//
42
// The compact hash table writer implementations
43
//
44
// Build the temporary (dump-time) table.
//
// num_entries - expected number of entries; only used to size the bucket array
//               through calculate_num_buckets().
// stats       - statistics record that allocate_table() fills in later.
//
// Every bucket starts out as an empty, C-heap allocated GrowableArray<Entry>.
// The compact arrays are left NULL until allocate_table() creates them.
CompactHashtableWriter::CompactHashtableWriter(int num_entries,
                                               CompactHashtableStats* stats) {
  Arguments::assert_is_dumping_archive();
  assert(num_entries >= 0, "sanity");
  _num_buckets = calculate_num_buckets(num_entries);
  assert(_num_buckets > 0, "no buckets");

  // Plain bookkeeping first; none of it depends on the bucket array.
  _stats = stats;
  _num_entries_written = 0;
  _num_empty_buckets = 0;
  _num_value_only_buckets = 0;
  _num_other_buckets = 0;
  _compact_buckets = NULL;
  _compact_entries = NULL;

  // One growable entry list per bucket.
  _buckets = NEW_C_HEAP_ARRAY(GrowableArray<Entry>*, _num_buckets, mtSymbol);
  for (int b = 0; b < _num_buckets; ++b) {
    _buckets[b] = new (ResourceObj::C_HEAP, mtSymbol) GrowableArray<Entry>(0, mtSymbol);
  }
}
64

65
// Release the temporary table: each per-bucket entry list first, then the
// bucket array that held them. The compact arrays are not freed here.
CompactHashtableWriter::~CompactHashtableWriter() {
  for (int b = 0; b < _num_buckets; ++b) {
    delete _buckets[b];
  }
  FREE_C_HEAP_ARRAY(GrowableArray<Entry>*, _buckets);
}
73

74
size_t CompactHashtableWriter::estimate_size(int num_entries) {
75
  int num_buckets = calculate_num_buckets(num_entries);
76
  size_t bucket_bytes = ArchiveBuilder::ro_array_bytesize<u4>(num_buckets + 1);
77

78
  // In worst case, we have no VALUE_ONLY_BUCKET_TYPE, so each entry takes 2 slots
79
  int entries_space = 2 * num_entries;
80
  size_t entry_bytes = ArchiveBuilder::ro_array_bytesize<u4>(entries_space);
81

82
  return bucket_bytes
83
       + entry_bytes
84
       + SimpleCompactHashtable::calculate_header_size();
85
}
86

87
// Add a symbol entry to the temporary hash table
88
void CompactHashtableWriter::add(unsigned int hash, u4 value) {
89
  int index = hash % _num_buckets;
90
  _buckets[index]->append_if_missing(Entry(hash, value));
91
  _num_entries_written++;
92
}
93

94
void CompactHashtableWriter::allocate_table() {
95
  int entries_space = 0;
96
  for (int index = 0; index < _num_buckets; index++) {
97
    GrowableArray<Entry>* bucket = _buckets[index];
98
    int bucket_size = bucket->length();
99
    if (bucket_size == 1) {
100
      entries_space++;
101
    } else if (bucket_size > 1) {
102
      entries_space += 2 * bucket_size;
103
    }
104
  }
105

106
  if (entries_space & ~BUCKET_OFFSET_MASK) {
107
    vm_exit_during_initialization("CompactHashtableWriter::allocate_table: Overflow! "
108
                                  "Too many entries.");
109
  }
110

111
  _compact_buckets = ArchiveBuilder::new_ro_array<u4>(_num_buckets + 1);
112
  _compact_entries = ArchiveBuilder::new_ro_array<u4>(entries_space);
113

114
  _stats->bucket_count    = _num_buckets;
115
  _stats->bucket_bytes    = align_up(_compact_buckets->size() * BytesPerWord,
116
                                     SharedSpaceObjectAlignment);
117
  _stats->hashentry_count = _num_entries_written;
118
  _stats->hashentry_bytes = align_up(_compact_entries->size() * BytesPerWord,
119
                                     SharedSpaceObjectAlignment);
120
}
121

122
// Write the compact table's buckets
123
void CompactHashtableWriter::dump_table(NumberSeq* summary) {
124
  u4 offset = 0;
125
  for (int index = 0; index < _num_buckets; index++) {
126
    GrowableArray<Entry>* bucket = _buckets[index];
127
    int bucket_size = bucket->length();
128
    if (bucket_size == 1) {
129
      // bucket with one entry is compacted and only has the symbol offset
130
      _compact_buckets->at_put(index, BUCKET_INFO(offset, VALUE_ONLY_BUCKET_TYPE));
131

132
      Entry ent = bucket->at(0);
133
      _compact_entries->at_put(offset++, ent.value());
134
      _num_value_only_buckets++;
135
    } else {
136
      // regular bucket, each entry is a symbol (hash, offset) pair
137
      _compact_buckets->at_put(index, BUCKET_INFO(offset, REGULAR_BUCKET_TYPE));
138

139
      for (int i=0; i<bucket_size; i++) {
140
        Entry ent = bucket->at(i);
141
        _compact_entries->at_put(offset++, u4(ent.hash())); // write entry hash
142
        _compact_entries->at_put(offset++, ent.value());
143
      }
144
      if (bucket_size == 0) {
145
        _num_empty_buckets++;
146
      } else {
147
        _num_other_buckets++;
148
      }
149
    }
150
    summary->add(bucket_size);
151
  }
152

153
  // Mark the end of the buckets
154
  _compact_buckets->at_put(_num_buckets, BUCKET_INFO(offset, TABLEEND_BUCKET_TYPE));
155
  assert(offset == (u4)_compact_entries->length(), "sanity");
156
}
157

158

159
// Write the compact table
160
void CompactHashtableWriter::dump(SimpleCompactHashtable *cht, const char* table_name) {
161
  NumberSeq summary;
162
  allocate_table();
163
  dump_table(&summary);
164

165
  int table_bytes = _stats->bucket_bytes + _stats->hashentry_bytes;
166
  address base_address = address(SharedBaseAddress);
167
  cht->init(base_address,  _num_entries_written, _num_buckets,
168
            _compact_buckets->data(), _compact_entries->data());
169

170
  LogMessage(cds, hashtables) msg;
171
  if (msg.is_info()) {
172
    double avg_cost = 0.0;
173
    if (_num_entries_written > 0) {
174
      avg_cost = double(table_bytes)/double(_num_entries_written);
175
    }
176
    msg.info("Shared %s table stats -------- base: " PTR_FORMAT,
177
                         table_name, (intptr_t)base_address);
178
    msg.info("Number of entries       : %9d", _num_entries_written);
179
    msg.info("Total bytes used        : %9d", table_bytes);
180
    msg.info("Average bytes per entry : %9.3f", avg_cost);
181
    msg.info("Average bucket size     : %9.3f", summary.avg());
182
    msg.info("Variance of bucket size : %9.3f", summary.variance());
183
    msg.info("Std. dev. of bucket size: %9.3f", summary.sd());
184
    msg.info("Maximum bucket size     : %9d", (int)summary.maximum());
185
    msg.info("Empty buckets           : %9d", _num_empty_buckets);
186
    msg.info("Value_Only buckets      : %9d", _num_value_only_buckets);
187
    msg.info("Other buckets           : %9d", _num_other_buckets);
188
  }
189
}
190

191
/////////////////////////////////////////////////////////////
192
//
193
// The CompactHashtable implementation
194
//
195

196
// Point this table at already-written bucket and entry arrays and remember
// the counts and base address that go with them. Nothing is copied.
void SimpleCompactHashtable::init(address base_address, u4 entry_count, u4 bucket_count, u4* buckets, u4* entries) {
  _base_address = base_address;
  _entry_count  = entry_count;
  _bucket_count = bucket_count;
  _buckets      = buckets;
  _entries      = entries;
}
203

204
// Number of bytes reserved for the serialized table header.
//
// The header is budgeted as 5 fields of sizeof(intptr_t) each (see
// WriteClosure::do_u4).
// NOTE(review): serialize_header() in this file writes four fields (two u4
// values and two pointers); confirm whether the fifth word is still needed.
size_t SimpleCompactHashtable::calculate_header_size() {
  const size_t header_fields = 5;
  return sizeof(intptr_t) * header_fields;
}
209

210
// Pass the header fields through 'soc' in a fixed order: entry count, bucket
// count, bucket array pointer, entry array pointer. When the closure is
// reading, the base address is not taken from the stream but reset to the
// current SharedBaseAddress.
//
// NOTE: if you change the set of fields handled here, you MUST update the
// field count used by calculate_header_size() to match.
void SimpleCompactHashtable::serialize_header(SerializeClosure* soc) {
  soc->do_u4(&_entry_count);
  soc->do_u4(&_bucket_count);
  soc->do_ptr((void**)&_buckets);
  soc->do_ptr((void**)&_entries);

  if (!soc->reading()) {
    return;
  }
  _base_address = (address)SharedBaseAddress;
}
221
#endif // INCLUDE_CDS
222

223
#ifndef O_BINARY       // if defined (Win32) use binary files.
224
#define O_BINARY 0     // otherwise do nothing.
225
#endif
226

227
////////////////////////////////////////////////////////
228
//
229
// HashtableTextDump
230
//
231
// Open 'filename' and map it into memory for parsing.
//
// Any failure (stat, open or map) is reported through quit(). On success the
// cursor (_p) is at the start of the mapping, _end is one past its last byte,
// the prefix type is Unknown and the line counter starts at 1. The filename
// pointer is stored as-is, not copied.
HashtableTextDump::HashtableTextDump(const char* filename) : _fd(-1) {
  struct stat file_info;
  if (os::stat(filename, &file_info) != 0) {
    quit("Unable to get hashtable dump file size", filename);
  }
  _size = file_info.st_size;

  _fd = os::open(filename, O_RDONLY | O_BINARY, 0);
  if (_fd < 0) {
    quit("Unable to open hashtable dump file", filename);
  }

  _base = os::map_memory(_fd, filename, 0, NULL, _size, true, false);
  if (_base == NULL) {
    quit("Unable to map hashtable dump file", filename);
  }

  // Parser state.
  _filename = filename;
  _line_no = 1;
  _prefix_type = Unknown;
  _p = _base;
  _end = _base + file_info.st_size;
}
251

252
// Undo the constructor: drop the file mapping, then close the descriptor if
// one was opened.
HashtableTextDump::~HashtableTextDump() {
  os::unmap_memory((char*)_base, _size);
  if (_fd < 0) {
    return;
  }
  close(_fd);
}
258

259
void HashtableTextDump::quit(const char* err, const char* msg) {
260
  vm_exit_during_initialization(err, msg);
261
}
262

263
void HashtableTextDump::corrupted(const char *p, const char* msg) {
264
  char info[100];
265
  jio_snprintf(info, sizeof(info),
266
               "%s. Corrupted at line %d (file pos %d)",
267
               msg, _line_no, (int)(p - _base));
268
  quit(info, _filename);
269
}
270

271
bool HashtableTextDump::skip_newline() {
272
  if (_p[0] == '\r' && _p[1] == '\n') {
273
    _p += 2;
274
  } else if (_p[0] == '\n') {
275
    _p += 1;
276
  } else {
277
    corrupted(_p, "Unexpected character");
278
  }
279
  _line_no++;
280
  return true;
281
}
282

283
int HashtableTextDump::skip(char must_be_char) {
284
  corrupted_if(remain() < 1, "Truncated");
285
  corrupted_if(*_p++ != must_be_char, "Unexpected character");
286
  return 0;
287
}
288

289
void HashtableTextDump::skip_past(char c) {
290
  for (;;) {
291
    corrupted_if(remain() < 1, "Truncated");
292
    if (*_p++ == c) {
293
      return;
294
    }
295
  }
296
}
297

298
void HashtableTextDump::check_version(const char* ver) {
299
  int len = (int)strlen(ver);
300
  corrupted_if(remain() < len, "Truncated");
301
  if (strncmp(_p, ver, len) != 0) {
302
    quit("wrong version of hashtable dump file", _filename);
303
  }
304
  _p += len;
305
  skip_newline();
306
}
307

308
void HashtableTextDump::scan_prefix_type() {
309
  _p++;
310
  if (strncmp(_p, "SECTION: String", 15) == 0) {
311
    _p += 15;
312
    _prefix_type = StringPrefix;
313
  } else if (strncmp(_p, "SECTION: Symbol", 15) == 0) {
314
    _p += 15;
315
    _prefix_type = SymbolPrefix;
316
  } else {
317
    _prefix_type = Unknown;
318
  }
319
  skip_newline();
320
}
321

322
int HashtableTextDump::scan_prefix(int* utf8_length) {
323
  if (*_p == '@') {
324
    scan_prefix_type();
325
  }
326

327
  switch (_prefix_type) {
328
  case SymbolPrefix:
329
    *utf8_length = scan_symbol_prefix(); break;
330
  case StringPrefix:
331
    *utf8_length = scan_string_prefix(); break;
332
  default:
333
    tty->print_cr("Shared input data type: Unknown.");
334
    corrupted(_p, "Unknown data type");
335
  }
336

337
  return _prefix_type;
338
}
339

340
int HashtableTextDump::scan_string_prefix() {
341
  // Expect /[0-9]+: /
342
  int utf8_length = 0;
343
  get_num(':', &utf8_length);
344
  if (*_p != ' ') {
345
    corrupted(_p, "Wrong prefix format for string");
346
  }
347
  _p++;
348
  return utf8_length;
349
}
350

351
int HashtableTextDump::scan_symbol_prefix() {
352
  // Expect /[0-9]+ (-|)[0-9]+: /
353
  int utf8_length = 0;
354
  get_num(' ', &utf8_length);
355
  if (*_p == '-') {
356
    _p++;
357
  }
358
  int ref_num;
359
  get_num(':', &ref_num);
360
  if (*_p != ' ') {
361
    corrupted(_p, "Wrong prefix format for symbol");
362
  }
363
  _p++;
364
  return utf8_length;
365
}
366

367
// Decode 'count' hexadecimal digits starting at 'from' into a number.
//
// from  - first hex digit.
// end   - one past the last readable byte of the input.
// count - number of digits to consume; get_utf8() passes 2.
//
// Returns the decoded value. Both upper- and lower-case digits are accepted.
//
// The digits come straight from the dump file, so bad input is reported
// through the normal corruption path instead of being treated as a VM bug:
// too few bytes left is "Truncated", a non-hex character is "Invalid hex
// digit". The length check compares distances so that no pointer beyond 'end'
// is ever formed.
jchar HashtableTextDump::unescape(const char* from, const char* end, int count) {
  corrupted_if(end - from < count, "Truncated");

  jchar value = 0;
  for (int i = 0; i < count; i++) {
    const char c = from[i];
    int digit = 0;
    if (c >= '0' && c <= '9') {
      digit = c - '0';
    } else if (c >= 'a' && c <= 'f') {
      digit = 10 + (c - 'a');
    } else if (c >= 'A' && c <= 'F') {
      digit = 10 + (c - 'A');
    } else {
      corrupted(from + i, "Invalid hex digit");
    }
    value = (jchar)((value << 4) + digit);
  }
  return value;
}
393

394
void HashtableTextDump::get_utf8(char* utf8_buffer, int utf8_length) {
395
  // cache in local vars
396
  const char* from = _p;
397
  const char* end = _end;
398
  char* to = utf8_buffer;
399
  int n = utf8_length;
400

401
  for (; n > 0 && from < end; n--) {
402
    if (*from != '\\') {
403
      *to++ = *from++;
404
    } else {
405
      corrupted_if(from + 2 > end, "Truncated");
406
      char c = from[1];
407
      from += 2;
408
      switch (c) {
409
      case 'x':
410
        {
411
          jchar value = unescape(from, end, 2);
412
          from += 2;
413
          assert(value <= 0xff, "sanity");
414
          *to++ = (char)(value & 0xff);
415
        }
416
        break;
417
      case 't':  *to++ = '\t'; break;
418
      case 'n':  *to++ = '\n'; break;
419
      case 'r':  *to++ = '\r'; break;
420
      case '\\': *to++ = '\\'; break;
421
      default:
422
        corrupted(_p, "Unsupported character");
423
      }
424
    }
425
  }
426
  corrupted_if(n > 0, "Truncated"); // expected more chars but file has ended
427
  _p = from;
428
  skip_newline();
429
}
430

431
// NOTE: the content is NOT the same as
432
// UTF8::as_quoted_ascii(const char* utf8_str, int utf8_length, char* buf, int buflen).
433
// We want to escape \r\n\t so that output [1] is more readable; [2] can be more easily
434
// parsed by scripts; [3] quickly processed by HashtableTextDump::get_utf8()
435
void HashtableTextDump::put_utf8(outputStream* st, const char* utf8_string, int utf8_length) {
436
  const char *c = utf8_string;
437
  const char *end = c + utf8_length;
438
  for (; c < end; c++) {
439
    switch (*c) {
440
    case '\t': st->print("\\t"); break;
441
    case '\r': st->print("\\r"); break;
442
    case '\n': st->print("\\n"); break;
443
    case '\\': st->print("\\\\"); break;
444
    default:
445
      if (isprint(*c)) {
446
        st->print("%c", *c);
447
      } else {
448
        st->print("\\x%02x", ((unsigned int)*c) & 0xff);
449
      }
450
    }
451
  }
452
}
453

454
Product

Resources

Company