Groonga 3.0.9 Source Code Document
 All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
hash.c
Go to the documentation of this file.
1 /*
2 ** hash.c - Hash class
3 **
4 ** See Copyright Notice in mruby.h
5 */
6 
7 #include "mruby.h"
8 #include "mruby/array.h"
9 #include "mruby/class.h"
10 #include "mruby/hash.h"
11 #include "mruby/khash.h"
12 #include "mruby/string.h"
13 #include "mruby/variable.h"
14 
15 static inline khint_t
16 mrb_hash_ht_hash_func(mrb_state *mrb, mrb_value key)
17 {
18  khint_t h = (khint_t)mrb_type(key) << 24;
19  mrb_value h2;
20 
21  h2 = mrb_funcall(mrb, key, "hash", 0, 0);
22  h ^= h2.value.i;
23  return h;
24 }
25 
26 static inline khint_t
27 mrb_hash_ht_hash_equal(mrb_state *mrb, mrb_value a, mrb_value b)
28 {
29  return mrb_eql(mrb, a, b);
30 }
31 
33 KHASH_DEFINE (ht, mrb_value, mrb_value, 1, mrb_hash_ht_hash_func, mrb_hash_ht_hash_equal)
34 
35 static void mrb_hash_modify(mrb_state *mrb, mrb_value hash);
36 
37 static inline mrb_value
38 mrb_hash_ht_key(mrb_state *mrb, mrb_value key)
39 {
40  if (mrb_string_p(key))
41  return mrb_str_dup(mrb, key);
42  else
43  return key;
44 }
45 
46 #define KEY(key) mrb_hash_ht_key(mrb, key)
47 
48 void
49 mrb_gc_mark_hash(mrb_state *mrb, struct RHash *hash)
50 {
51  khiter_t k;
52  khash_t(ht) *h = hash->ht;
53 
54  if (!h) return;
55  for (k = kh_begin(h); k != kh_end(h); k++) {
56  if (kh_exist(h, k)) {
57  mrb_value key = kh_key(h, k);
58  mrb_value val = kh_value(h, k);
59 
60  mrb_gc_mark_value(mrb, key);
61  mrb_gc_mark_value(mrb, val);
62  }
63  }
64 }
65 
66 size_t
68 {
69  if (!hash->ht) return 0;
70  return kh_size(hash->ht)*2;
71 }
72 
73 void
74 mrb_gc_free_hash(mrb_state *mrb, struct RHash *hash)
75 {
76  if (hash->ht) kh_destroy(ht, hash->ht);
77 }
78 
79 
80 mrb_value
82 {
83  struct RHash *h;
84 
85  h = (struct RHash*)mrb_obj_alloc(mrb, MRB_TT_HASH, mrb->hash_class);
86  h->ht = kh_init(ht, mrb);
87  if (capa > 0) {
88  kh_resize(ht, h->ht, capa);
89  }
90  h->iv = 0;
91  return mrb_obj_value(h);
92 }
93 
94 mrb_value
96 {
97  return mrb_hash_new_capa(mrb, 0);
98 }
99 
100 mrb_value
101 mrb_hash_get(mrb_state *mrb, mrb_value hash, mrb_value key)
102 {
103  khash_t(ht) *h = RHASH_TBL(hash);
104  khiter_t k;
105 
106  if (h) {
107  k = kh_get(ht, h, key);
108  if (k != kh_end(h))
109  return kh_value(h, k);
110  }
111 
112  /* not found */
113  if (MRB_RHASH_PROCDEFAULT_P(hash)) {
114  return mrb_funcall(mrb, RHASH_PROCDEFAULT(hash), "call", 2, hash, key);
115  }
116  return RHASH_IFNONE(hash);
117 }
118 
119 mrb_value
120 mrb_hash_fetch(mrb_state *mrb, mrb_value hash, mrb_value key, mrb_value def)
121 {
122  khash_t(ht) *h = RHASH_TBL(hash);
123  khiter_t k;
124 
125  if (h) {
126  k = kh_get(ht, h, key);
127  if (k != kh_end(h))
128  return kh_value(h, k);
129  }
130 
131  /* not found */
132  return def;
133 }
134 
135 void
136 mrb_hash_set(mrb_state *mrb, mrb_value hash, mrb_value key, mrb_value val) /* mrb_hash_aset */
137 {
138  khash_t(ht) *h;
139  khiter_t k;
140 
141  mrb_hash_modify(mrb, hash);
142  h = RHASH_TBL(hash);
143 
144  if (!h) h = RHASH_TBL(hash) = kh_init(ht, mrb);
145  k = kh_get(ht, h, key);
146  if (k == kh_end(h)) {
147  /* expand */
148  int ai = mrb_gc_arena_save(mrb);
149  k = kh_put(ht, h, KEY(key));
150  mrb_gc_arena_restore(mrb, ai);
151  }
152 
153  kh_value(h, k) = val;
154  mrb_write_barrier(mrb, (struct RBasic*)RHASH(hash));
155  return;
156 }
157 
158 mrb_value
159 mrb_hash_dup(mrb_state *mrb, mrb_value hash)
160 {
161  struct RHash* ret;
162  khash_t(ht) *h, *ret_h;
163  khiter_t k, ret_k;
164 
165  h = RHASH_TBL(hash);
166  ret = (struct RHash*)mrb_obj_alloc(mrb, MRB_TT_HASH, mrb->hash_class);
167  ret->ht = kh_init(ht, mrb);
168 
169  if (kh_size(h) > 0) {
170  ret_h = ret->ht;
171 
172  for (k = kh_begin(h); k != kh_end(h); k++) {
173  if (kh_exist(h,k)) {
174  int ai = mrb_gc_arena_save(mrb);
175  ret_k = kh_put(ht, ret_h, KEY(kh_key(h,k)));
176  mrb_gc_arena_restore(mrb, ai);
177  kh_val(ret_h, ret_k) = kh_val(h,k);
178  }
179  }
180  }
181 
182  return mrb_obj_value(ret);
183 }
184 
185 mrb_value
186 mrb_check_hash_type(mrb_state *mrb, mrb_value hash)
187 {
188  return mrb_check_convert_type(mrb, hash, MRB_TT_HASH, "Hash", "to_hash");
189 }
190 
191 khash_t(ht) *
192 mrb_hash_tbl(mrb_state *mrb, mrb_value hash)
193 {
194  khash_t(ht) *h = RHASH_TBL(hash);
195 
196  if (!h) {
197  RHASH_TBL(hash) = kh_init(ht, mrb);
198  }
199  return h;
200 }
201 
202 static void
203 mrb_hash_modify(mrb_state *mrb, mrb_value hash)
204 {
205  mrb_hash_tbl(mrb, hash);
206 }
207 
208 /* 15.2.13.4.16 */
209 /*
210  * call-seq:
211  * Hash.new -> new_hash
212  * Hash.new(obj) -> new_hash
213  * Hash.new {|hash, key| block } -> new_hash
214  *
215  * Returns a new, empty hash. If this hash is subsequently accessed by
216  * a key that doesn't correspond to a hash entry, the value returned
217  * depends on the style of <code>new</code> used to create the hash. In
218  * the first form, the access returns <code>nil</code>. If
219  * <i>obj</i> is specified, this single object will be used for
220  * all <em>default values</em>. If a block is specified, it will be
221  * called with the hash object and the key, and should return the
222  * default value. It is the block's responsibility to store the value
223  * in the hash if required.
224  *
225  * h = Hash.new("Go Fish")
226  * h["a"] = 100
227  * h["b"] = 200
228  * h["a"] #=> 100
229  * h["c"] #=> "Go Fish"
230  * # The following alters the single default object
231  * h["c"].upcase! #=> "GO FISH"
232  * h["d"] #=> "GO FISH"
233  * h.keys #=> ["a", "b"]
234  *
235  * # While this creates a new default object each time
236  * h = Hash.new { |hash, key| hash[key] = "Go Fish: #{key}" }
237  * h["c"] #=> "Go Fish: c"
238  * h["c"].upcase! #=> "GO FISH: C"
239  * h["d"] #=> "Go Fish: d"
240  * h.keys #=> ["c", "d"]
241  *
242  */
243 
244 static mrb_value
245 mrb_hash_init_core(mrb_state *mrb, mrb_value hash)
246 {
247  mrb_value block, ifnone;
248  mrb_value *argv;
249  int argc;
250 
251  mrb_get_args(mrb, "o*", &block, &argv, &argc);
252  mrb_hash_modify(mrb, hash);
253  if (mrb_nil_p(block)) {
254  if (argc > 0) {
255  if (argc != 1) mrb_raise(mrb, E_ARGUMENT_ERROR, "wrong number of arguments");
256  ifnone = argv[0];
257  }
258  else {
259  ifnone = mrb_nil_value();
260  }
261  }
262  else {
263  if (argc > 0) {
264  mrb_raise(mrb, E_ARGUMENT_ERROR, "wrong number of arguments");
265  }
266  RHASH(hash)->flags |= MRB_HASH_PROC_DEFAULT;
267  ifnone = block;
268  }
269  mrb_iv_set(mrb, hash, mrb_intern2(mrb, "ifnone", 6), ifnone);
270  return hash;
271 }
272 
273 /*
274  * call-seq:
275  * Hash[ key, value, ... ] -> new_hash
276  * Hash[ [ [key, value], ... ] ] -> new_hash
277  * Hash[ object ] -> new_hash
278  *
279  * Creates a new hash populated with the given objects. Equivalent to
280  * the literal <code>{ <i>key</i> => <i>value</i>, ... }</code>. In the first
281  * form, keys and values occur in pairs, so there must be an even number of arguments.
282  * The second and third form take a single argument which is either
283  * an array of key-value pairs or an object convertible to a hash.
284  *
285  * Hash["a", 100, "b", 200] #=> {"a"=>100, "b"=>200}
286  * Hash[ [ ["a", 100], ["b", 200] ] ] #=> {"a"=>100, "b"=>200}
287  * Hash["a" => 100, "b" => 200] #=> {"a"=>100, "b"=>200}
288  */
289 
290 static mrb_value
291 to_hash(mrb_state *mrb, mrb_value hash)
292 {
293  return mrb_convert_type(mrb, hash, MRB_TT_HASH, "Hash", "to_hash");
294 }
295 
296 /*
297  * call-seq:
298  * Hash.try_convert(obj) -> hash or nil
299  *
300  * Try to convert <i>obj</i> into a hash, using to_hash method.
301  * Returns converted hash or nil if <i>obj</i> cannot be converted
302  * for any reason.
303  *
304  * Hash.try_convert({1=>2}) # => {1=>2}
305  * Hash.try_convert("1=>2") # => nil
306  */
307 
308 /* 15.2.13.4.2 */
309 /*
310  * call-seq:
311  * hsh[key] -> value
312  *
313  * Element Reference---Retrieves the <i>value</i> object corresponding
314  * to the <i>key</i> object. If not found, returns the default value (see
315  * <code>Hash::new</code> for details).
316  *
317  * h = { "a" => 100, "b" => 200 }
318  * h["a"] #=> 100
319  * h["c"] #=> nil
320  *
321  */
322 mrb_value
323 mrb_hash_aget(mrb_state *mrb, mrb_value self)
324 {
325  mrb_value key;
326 
327  mrb_get_args(mrb, "o", &key);
328  return mrb_hash_get(mrb, self, key);
329 }
330 
331 /*
332  * call-seq:
333  * hsh.fetch(key [, default] ) -> obj
334  * hsh.fetch(key) {| key | block } -> obj
335  *
336  * Returns a value from the hash for the given key. If the key can't be
337  * found, there are several options: With no other arguments, it will
338  * raise an <code>KeyError</code> exception; if <i>default</i> is
339  * given, then that will be returned; if the optional code block is
340  * specified, then that will be run and its result returned.
341  *
342  * h = { "a" => 100, "b" => 200 }
343  * h.fetch("a") #=> 100
344  * h.fetch("z", "go fish") #=> "go fish"
345  * h.fetch("z") { |el| "go fish, #{el}"} #=> "go fish, z"
346  *
347  * The following example shows that an exception is raised if the key
348  * is not found and a default value is not supplied.
349  *
350  * h = { "a" => 100, "b" => 200 }
351  * h.fetch("z")
352  *
353  * <em>produces:</em>
354  *
355  * prog.rb:2:in `fetch': key not found (KeyError)
356  * from prog.rb:2
357  *
358  */
359 
360 /* 15.2.13.4.5 */
361 /*
362  * call-seq:
363  * hsh.default(key=nil) -> obj
364  *
365  * Returns the default value, the value that would be returned by
366  * <i>hsh</i>[<i>key</i>] if <i>key</i> did not exist in <i>hsh</i>.
367  * See also <code>Hash::new</code> and <code>Hash#default=</code>.
368  *
369  * h = Hash.new #=> {}
370  * h.default #=> nil
371  * h.default(2) #=> nil
372  *
373  * h = Hash.new("cat") #=> {}
374  * h.default #=> "cat"
375  * h.default(2) #=> "cat"
376  *
377  * h = Hash.new {|h,k| h[k] = k.to_i*10} #=> {}
378  * h.default #=> nil
379  * h.default(2) #=> 20
380  */
381 
382 static mrb_value
383 mrb_hash_default(mrb_state *mrb, mrb_value hash)
384 {
385  mrb_value *argv;
386  int argc;
387  mrb_value key;
388 
389  mrb_get_args(mrb, "*", &argv, &argc);
390  if (MRB_RHASH_PROCDEFAULT_P(hash)) {
391  if (argc == 0) return mrb_nil_value();
392  key = argv[0];
393  return mrb_funcall(mrb, RHASH_PROCDEFAULT(hash), "call", 2, hash, key);
394  }
395  else {
396  return RHASH_IFNONE(hash);
397  }
398 }
399 
400 /* 15.2.13.4.6 */
401 /*
402  * call-seq:
403  * hsh.default = obj -> obj
404  *
405  * Sets the default value, the value returned for a key that does not
406  * exist in the hash. It is not possible to set the default to a
407  * <code>Proc</code> that will be executed on each key lookup.
408  *
409  * h = { "a" => 100, "b" => 200 }
410  * h.default = "Go fish"
411  * h["a"] #=> 100
412  * h["z"] #=> "Go fish"
413  * # This doesn't do what you might hope...
414  * h.default = proc do |hash, key|
415  * hash[key] = key + key
416  * end
417  * h[2] #=> #<Proc:0x401b3948@-:6>
418  * h["cat"] #=> #<Proc:0x401b3948@-:6>
419  */
420 
421 static mrb_value
422 mrb_hash_set_default(mrb_state *mrb, mrb_value hash)
423 {
424  mrb_value ifnone;
425 
426  mrb_get_args(mrb, "o", &ifnone);
427  mrb_hash_modify(mrb, hash);
428  mrb_iv_set(mrb, hash, mrb_intern2(mrb, "ifnone", 6), ifnone);
429  RHASH(hash)->flags &= ~(MRB_HASH_PROC_DEFAULT);
430 
431  return ifnone;
432 }
433 
434 /* 15.2.13.4.7 */
435 /*
436  * call-seq:
437  * hsh.default_proc -> anObject
438  *
439  * If <code>Hash::new</code> was invoked with a block, return that
440  * block, otherwise return <code>nil</code>.
441  *
442  * h = Hash.new {|h,k| h[k] = k*k } #=> {}
443  * p = h.default_proc #=> #<Proc:0x401b3d08@-:1>
444  * a = [] #=> []
445  * p.call(a, 2)
446  * a #=> [nil, nil, 4]
447  */
448 
449 
450 static mrb_value
451 mrb_hash_default_proc(mrb_state *mrb, mrb_value hash)
452 {
453  if (MRB_RHASH_PROCDEFAULT_P(hash)) {
454  return RHASH_PROCDEFAULT(hash);
455  }
456  return mrb_nil_value();
457 }
458 
459 /*
460  * call-seq:
461  * hsh.default_proc = proc_obj -> proc_obj
462  *
463  * Sets the default proc to be executed on each key lookup.
464  *
465  * h.default_proc = proc do |hash, key|
466  * hash[key] = key + key
467  * end
468  * h[2] #=> 4
469  * h["cat"] #=> "catcat"
470  */
471 
472 static mrb_value
473 mrb_hash_set_default_proc(mrb_state *mrb, mrb_value hash)
474 {
475  mrb_value ifnone;
476 
477  mrb_get_args(mrb, "o", &ifnone);
478  mrb_hash_modify(mrb, hash);
479  mrb_iv_set(mrb, hash, mrb_intern2(mrb, "ifnone", 6), ifnone);
480  RHASH(hash)->flags |= MRB_HASH_PROC_DEFAULT;
481 
482  return ifnone;
483 }
484 
485 mrb_value
486 mrb_hash_delete_key(mrb_state *mrb, mrb_value hash, mrb_value key)
487 {
488  khash_t(ht) *h = RHASH_TBL(hash);
489  khiter_t k;
490  mrb_value delVal;
491 
492  if (h) {
493  k = kh_get(ht, h, key);
494  if (k != kh_end(h)) {
495  delVal = kh_value(h, k);
496  kh_del(ht, h, k);
497  return delVal;
498  }
499  }
500 
501  /* not found */
502  return mrb_nil_value();
503 }
504 
505 /* 15.2.13.4.8 */
506 /*
507  * call-seq:
508  * hsh.delete(key) -> value
509  * hsh.delete(key) {| key | block } -> value
510  *
511  * Deletes and returns a key-value pair from <i>hsh</i> whose key is
512  * equal to <i>key</i>. If the key is not found, returns the
513  * <em>default value</em>. If the optional code block is given and the
514  * key is not found, pass in the key and return the result of
515  * <i>block</i>.
516  *
517  * h = { "a" => 100, "b" => 200 }
518  * h.delete("a") #=> 100
519  * h.delete("z") #=> nil
520  * h.delete("z") { |el| "#{el} not found" } #=> "z not found"
521  *
522  */
523 mrb_value
524 mrb_hash_delete(mrb_state *mrb, mrb_value self)
525 {
526  mrb_value key;
527 
528  mrb_get_args(mrb, "o", &key);
529  return mrb_hash_delete_key(mrb, self, key);
530 }
531 
532 /* 15.2.13.4.24 */
533 /*
534  * call-seq:
535  * hsh.shift -> anArray or obj
536  *
537  * Removes a key-value pair from <i>hsh</i> and returns it as the
538  * two-item array <code>[</code> <i>key, value</i> <code>]</code>, or
539  * the hash's default value if the hash is empty.
540  *
541  * h = { 1 => "a", 2 => "b", 3 => "c" }
542  * h.shift #=> [1, "a"]
543  * h #=> {2=>"b", 3=>"c"}
544  */
545 
546 static mrb_value
547 mrb_hash_shift(mrb_state *mrb, mrb_value hash)
548 {
549  khash_t(ht) *h = RHASH_TBL(hash);
550  khiter_t k;
551  mrb_value delKey, delVal;
552 
553  mrb_hash_modify(mrb, hash);
554  if (h) {
555  if (kh_size(h) > 0) {
556  for (k = kh_begin(h); k != kh_end(h); k++) {
557  if (!kh_exist(h,k)) continue;
558 
559  delKey = kh_key(h,k);
560  mrb_gc_protect(mrb, delKey);
561  delVal = mrb_hash_delete_key(mrb, hash, delKey);
562  mrb_gc_protect(mrb, delVal);
563 
564  return mrb_assoc_new(mrb, delKey, delVal);
565  }
566  }
567  }
568 
569  if (MRB_RHASH_PROCDEFAULT_P(hash)) {
570  return mrb_funcall(mrb, RHASH_PROCDEFAULT(hash), "call", 2, hash, mrb_nil_value());
571  }
572  else {
573  return RHASH_IFNONE(hash);
574  }
575 }
576 
577 /*
578  * call-seq:
579  * hsh.delete_if {| key, value | block } -> hsh
580  * hsh.delete_if -> an_enumerator
581  *
582  * Deletes every key-value pair from <i>hsh</i> for which <i>block</i>
583  * evaluates to <code>true</code>.
584  *
585  * If no block is given, an enumerator is returned instead.
586  *
587  * h = { "a" => 100, "b" => 200, "c" => 300 }
588  * h.delete_if {|key, value| key >= "b" } #=> {"a"=>100}
589  *
590  */
591 
592 /*
593  * call-seq:
594  * hsh.reject! {| key, value | block } -> hsh or nil
595  * hsh.reject! -> an_enumerator
596  *
597  * Equivalent to <code>Hash#delete_if</code>, but returns
598  * <code>nil</code> if no changes were made.
599  */
600 
601 /*
602  * call-seq:
603  * hsh.reject {| key, value | block } -> a_hash
604  *
605  * Same as <code>Hash#delete_if</code>, but works on (and returns) a
606  * copy of the <i>hsh</i>. Equivalent to
607  * <code><i>hsh</i>.dup.delete_if</code>.
608  *
609  */
610 
611 /*
612  * call-seq:
613  * hsh.select {|key, value| block} -> a_hash
614  * hsh.select -> an_enumerator
615  *
616  * Returns a new hash consisting of entries for which the block returns true.
617  *
618  * If no block is given, an enumerator is returned instead.
619  *
620  * h = { "a" => 100, "b" => 200, "c" => 300 }
621  * h.select {|k,v| k > "a"} #=> {"b" => 200, "c" => 300}
622  * h.select {|k,v| v < 200} #=> {"a" => 100}
623  */
624 
625 /*
626  * call-seq:
627  * hsh.select! {| key, value | block } -> hsh or nil
628  * hsh.select! -> an_enumerator
629  *
630  * Equivalent to <code>Hash#keep_if</code>, but returns
631  * <code>nil</code> if no changes were made.
632  */
633 
634 /*
635  * call-seq:
636  * hsh.keep_if {| key, value | block } -> hsh
637  * hsh.keep_if -> an_enumerator
638  *
639  * Deletes every key-value pair from <i>hsh</i> for which <i>block</i>
640  * evaluates to false.
641  *
642  * If no block is given, an enumerator is returned instead.
643  *
644  */
645 
646 /* 15.2.13.4.4 */
647 /*
648  * call-seq:
649  * hsh.clear -> hsh
650  *
651  * Removes all key-value pairs from <i>hsh</i>.
652  *
653  * h = { "a" => 100, "b" => 200 } #=> {"a"=>100, "b"=>200}
654  * h.clear #=> {}
655  *
656  */
657 
658 mrb_value
659 mrb_hash_clear(mrb_state *mrb, mrb_value hash)
660 {
661  khash_t(ht) *h = RHASH_TBL(hash);
662 
663  if (h) kh_clear(ht, h);
664  return hash;
665 }
666 
667 /* 15.2.13.4.3 */
668 /* 15.2.13.4.26 */
669 /*
670  * call-seq:
671  * hsh[key] = value -> value
672  * hsh.store(key, value) -> value
673  *
674  * Element Assignment---Associates the value given by
675  * <i>value</i> with the key given by <i>key</i>.
676  * <i>key</i> should not have its value changed while it is in
677  * use as a key (a <code>String</code> passed as a key will be
678  * duplicated and frozen).
679  *
680  * h = { "a" => 100, "b" => 200 }
681  * h["a"] = 9
682  * h["c"] = 4
683  * h #=> {"a"=>9, "b"=>200, "c"=>4}
684  *
685  */
686 mrb_value
687 mrb_hash_aset(mrb_state *mrb, mrb_value self)
688 {
689  mrb_value key, val;
690 
691  mrb_get_args(mrb, "oo", &key, &val);
692  mrb_hash_set(mrb, self, key, val);
693  return val;
694 }
695 
696 /* 15.2.13.4.17 */
697 /* 15.2.13.4.23 */
698 /*
699  * call-seq:
700  * hsh.replace(other_hash) -> hsh
701  *
702  * Replaces the contents of <i>hsh</i> with the contents of
703  * <i>other_hash</i>.
704  *
705  * h = { "a" => 100, "b" => 200 }
706  * h.replace({ "c" => 300, "d" => 400 }) #=> {"c"=>300, "d"=>400}
707  *
708  */
709 
710 static mrb_value
711 mrb_hash_replace(mrb_state *mrb, mrb_value hash)
712 {
713  mrb_value hash2, ifnone;
714  khash_t(ht) *h2;
715  khiter_t k;
716 
717  mrb_get_args(mrb, "o", &hash2);
718  hash2 = to_hash(mrb, hash2);
719  if (mrb_obj_equal(mrb, hash, hash2)) return hash;
720  mrb_hash_clear(mrb, hash);
721 
722  h2 = RHASH_TBL(hash2);
723  if (h2) {
724  for (k = kh_begin(h2); k != kh_end(h2); k++) {
725  if (kh_exist(h2, k))
726  mrb_hash_set(mrb, hash, kh_key(h2, k), kh_value(h2, k));
727  }
728  }
729 
730  if (MRB_RHASH_PROCDEFAULT_P(hash2)) {
731  RHASH(hash)->flags |= MRB_HASH_PROC_DEFAULT;
732  ifnone = RHASH_PROCDEFAULT(hash2);
733  }
734  else {
735  ifnone = RHASH_IFNONE(hash2);
736  }
737  mrb_iv_set(mrb, hash, mrb_intern2(mrb, "ifnone", 6), ifnone);
738 
739  return hash;
740 }
741 
742 /* 15.2.13.4.20 */
743 /* 15.2.13.4.25 */
744 /*
745  * call-seq:
746  * hsh.length -> fixnum
747  * hsh.size -> fixnum
748  *
749  * Returns the number of key-value pairs in the hash.
750  *
751  * h = { "d" => 100, "a" => 200, "v" => 300, "e" => 400 }
752  * h.length #=> 4
753  * h.delete("a") #=> 200
754  * h.length #=> 3
755  */
756 static mrb_value
757 mrb_hash_size_m(mrb_state *mrb, mrb_value self)
758 {
759  khash_t(ht) *h = RHASH_TBL(self);
760 
761  if (!h) return mrb_fixnum_value(0);
762  return mrb_fixnum_value(kh_size(h));
763 }
764 
765 /* 15.2.13.4.12 */
766 /*
767  * call-seq:
768  * hsh.empty? -> true or false
769  *
770  * Returns <code>true</code> if <i>hsh</i> contains no key-value pairs.
771  *
772  * {}.empty? #=> true
773  *
774  */
775 mrb_value
776 mrb_hash_empty_p(mrb_state *mrb, mrb_value self)
777 {
778  khash_t(ht) *h = RHASH_TBL(self);
779 
780  if (h) return mrb_bool_value(kh_size(h) == 0);
781  return mrb_true_value();
782 }
783 
784 static mrb_value
785 inspect_hash(mrb_state *mrb, mrb_value hash, int recur)
786 {
787  mrb_value str, str2;
788  khash_t(ht) *h = RHASH_TBL(hash);
789  khiter_t k;
790 
791  if (recur) return mrb_str_new(mrb, "{...}", 5);
792 
793  str = mrb_str_new(mrb, "{", 1);
794  if (h && kh_size(h) > 0) {
795  for (k = kh_begin(h); k != kh_end(h); k++) {
796  int ai;
797 
798  if (!kh_exist(h,k)) continue;
799 
800  ai = mrb_gc_arena_save(mrb);
801 
802  if (RSTRING_LEN(str) > 1) mrb_str_cat(mrb, str, ", ", 2);
803 
804  str2 = mrb_inspect(mrb, kh_key(h,k));
805  mrb_str_append(mrb, str, str2);
806  mrb_str_buf_cat(mrb, str, "=>", 2);
807  str2 = mrb_inspect(mrb, kh_value(h,k));
808  mrb_str_append(mrb, str, str2);
809 
810  mrb_gc_arena_restore(mrb, ai);
811  }
812  }
813  mrb_str_buf_cat(mrb, str, "}", 1);
814 
815  return str;
816 }
817 
818 /* 15.2.13.4.30 (x)*/
819 /*
820  * call-seq:
821  * hsh.to_s -> string
822  * hsh.inspect -> string
823  *
824  * Return the contents of this hash as a string.
825  *
826  * h = { "c" => 300, "a" => 100, "d" => 400, "c" => 300 }
827  * h.to_s #=> "{\"c\"=>300, \"a\"=>100, \"d\"=>400}"
828  */
829 
830 static mrb_value
831 mrb_hash_inspect(mrb_state *mrb, mrb_value hash)
832 {
833  khash_t(ht) *h = RHASH_TBL(hash);
834 
835  if (!h || kh_size(h) == 0)
836  return mrb_str_new(mrb, "{}", 2);
837  return inspect_hash(mrb, hash, 0);
838 }
839 
840 /* 15.2.13.4.29 (x)*/
841 /*
842  * call-seq:
843  * hsh.to_hash => hsh
844  *
845  * Returns +self+.
846  */
847 
848 static mrb_value
849 mrb_hash_to_hash(mrb_state *mrb, mrb_value hash)
850 {
851  return hash;
852 }
853 
854 /* 15.2.13.4.19 */
855 /*
856  * call-seq:
857  * hsh.keys -> array
858  *
859  * Returns a new array populated with the keys from this hash. See also
860  * <code>Hash#values</code>.
861  *
862  * h = { "a" => 100, "b" => 200, "c" => 300, "d" => 400 }
863  * h.keys #=> ["a", "b", "c", "d"]
864  *
865  */
866 
867 mrb_value
868 mrb_hash_keys(mrb_state *mrb, mrb_value hash)
869 {
870  khash_t(ht) *h = RHASH_TBL(hash);
871  khiter_t k;
872  mrb_value ary;
873 
874  if (!h) return mrb_ary_new(mrb);
875  ary = mrb_ary_new_capa(mrb, kh_size(h));
876  for (k = kh_begin(h); k != kh_end(h); k++) {
877  if (kh_exist(h, k)) {
878  mrb_value v = kh_key(h,k);
879  mrb_ary_push(mrb, ary, v);
880  }
881  }
882  return ary;
883 }
884 
885 /* 15.2.13.4.28 */
886 /*
887  * call-seq:
888  * hsh.values -> array
889  *
890  * Returns a new array populated with the values from <i>hsh</i>. See
891  * also <code>Hash#keys</code>.
892  *
893  * h = { "a" => 100, "b" => 200, "c" => 300 }
894  * h.values #=> [100, 200, 300]
895  *
896  */
897 
898 static mrb_value
899 mrb_hash_values(mrb_state *mrb, mrb_value hash)
900 {
901  khash_t(ht) *h = RHASH_TBL(hash);
902  khiter_t k;
903  mrb_value ary;
904 
905  if (!h) return mrb_ary_new(mrb);
906  ary = mrb_ary_new_capa(mrb, kh_size(h));
907  for (k = kh_begin(h); k != kh_end(h); k++) {
908  if (kh_exist(h, k)){
909  mrb_value v = kh_value(h,k);
910  mrb_ary_push(mrb, ary, v);
911  }
912  }
913  return ary;
914 }
915 
916 static mrb_value
917 mrb_hash_has_keyWithKey(mrb_state *mrb, mrb_value hash, mrb_value key)
918 {
919  khash_t(ht) *h = RHASH_TBL(hash);
920  khiter_t k;
921 
922  if (h) {
923  k = kh_get(ht, h, key);
924  return mrb_bool_value(k != kh_end(h));
925  }
926  return mrb_false_value();
927 }
928 
929 /* 15.2.13.4.13 */
930 /* 15.2.13.4.15 */
931 /* 15.2.13.4.18 */
932 /* 15.2.13.4.21 */
933 /*
934  * call-seq:
935  * hsh.has_key?(key) -> true or false
936  * hsh.include?(key) -> true or false
937  * hsh.key?(key) -> true or false
938  * hsh.member?(key) -> true or false
939  *
940  * Returns <code>true</code> if the given key is present in <i>hsh</i>.
941  *
942  * h = { "a" => 100, "b" => 200 }
943  * h.has_key?("a") #=> true
944  * h.has_key?("z") #=> false
945  *
946  */
947 
948 static mrb_value
949 mrb_hash_has_key(mrb_state *mrb, mrb_value hash)
950 {
951  mrb_value key;
952 
953  mrb_get_args(mrb, "o", &key);
954  return mrb_hash_has_keyWithKey(mrb, hash, key);
955 }
956 
957 static mrb_value
958 mrb_hash_has_valueWithvalue(mrb_state *mrb, mrb_value hash, mrb_value value)
959 {
960  khash_t(ht) *h = RHASH_TBL(hash);
961  khiter_t k;
962 
963  if (h) {
964  for (k = kh_begin(h); k != kh_end(h); k++) {
965  if (!kh_exist(h, k)) continue;
966 
967  if (mrb_equal(mrb, kh_value(h,k), value)) {
968  return mrb_true_value();
969  }
970  }
971  }
972 
973  return mrb_false_value();
974 }
975 
976 /* 15.2.13.4.14 */
977 /* 15.2.13.4.27 */
978 /*
979  * call-seq:
980  * hsh.has_value?(value) -> true or false
981  * hsh.value?(value) -> true or false
982  *
983  * Returns <code>true</code> if the given value is present for some key
984  * in <i>hsh</i>.
985  *
986  * h = { "a" => 100, "b" => 200 }
987  * h.has_value?(100) #=> true
988  * h.has_value?(999) #=> false
989  */
990 
991 static mrb_value
992 mrb_hash_has_value(mrb_state *mrb, mrb_value hash)
993 {
994  mrb_value val;
995 
996  mrb_get_args(mrb, "o", &val);
997  return mrb_hash_has_valueWithvalue(mrb, hash, val);
998 }
999 
1000 static mrb_value
1001 hash_equal(mrb_state *mrb, mrb_value hash1, mrb_value hash2, int eql)
1002 {
1003  khash_t(ht) *h1, *h2;
1004 
1005  if (mrb_obj_equal(mrb, hash1, hash2)) return mrb_true_value();
1006  if (!mrb_hash_p(hash2)) {
1007  if (!mrb_respond_to(mrb, hash2, mrb_intern2(mrb, "to_hash", 7))) {
1008  return mrb_false_value();
1009  }
1010  if (eql)
1011  return mrb_fixnum_value(mrb_eql(mrb, hash2, hash1));
1012  else
1013  return mrb_fixnum_value(mrb_equal(mrb, hash2, hash1));
1014  }
1015  h1 = RHASH_TBL(hash1);
1016  h2 = RHASH_TBL(hash2);
1017  if (!h1) {
1018  return mrb_bool_value(!h2);
1019  }
1020  if (!h2) return mrb_false_value();
1021  if (kh_size(h1) != kh_size(h2)) return mrb_false_value();
1022  else {
1023  khiter_t k1, k2;
1024  mrb_value key;
1025 
1026  for (k1 = kh_begin(h1); k1 != kh_end(h1); k1++) {
1027  if (!kh_exist(h1, k1)) continue;
1028  key = kh_key(h1,k1);
1029  k2 = kh_get(ht, h2, key);
1030  if (k2 != kh_end(h2)) {
1031  if (mrb_equal(mrb, kh_value(h1,k1), kh_value(h2,k2))) {
1032  continue; /* next key */
1033  }
1034  }
1035  return mrb_false_value();
1036  }
1037  }
1038  return mrb_true_value();
1039 }
1040 
1041 /* 15.2.13.4.1 */
1042 /*
1043  * call-seq:
1044  * hsh == other_hash -> true or false
1045  *
1046  * Equality---Two hashes are equal if they each contain the same number
1047  * of keys and if each key-value pair is equal to (according to
1048  * <code>Object#==</code>) the corresponding elements in the other
1049  * hash.
1050  *
1051  * h1 = { "a" => 1, "c" => 2 }
1052  * h2 = { 7 => 35, "c" => 2, "a" => 1 }
1053  * h3 = { "a" => 1, "c" => 2, 7 => 35 }
1054  * h4 = { "a" => 1, "d" => 2, "f" => 35 }
1055  * h1 == h2 #=> false
1056  * h2 == h3 #=> true
1057  * h3 == h4 #=> false
1058  *
1059  */
1060 
1061 static mrb_value
1062 mrb_hash_equal(mrb_state *mrb, mrb_value hash1)
1063 {
1064  mrb_value hash2;
1065 
1066  mrb_get_args(mrb, "o", &hash2);
1067  return hash_equal(mrb, hash1, hash2, FALSE);
1068 }
1069 
1070 /* 15.2.13.4.32 (x)*/
1071 /*
1072  * call-seq:
1073  * hash.eql?(other) -> true or false
1074  *
1075  * Returns <code>true</code> if <i>hash</i> and <i>other</i> are
1076  * both hashes with the same content.
1077  */
1078 
1079 static mrb_value
1080 mrb_hash_eql(mrb_state *mrb, mrb_value hash1)
1081 {
1082  mrb_value hash2;
1083 
1084  mrb_get_args(mrb, "o", &hash2);
1085  return hash_equal(mrb, hash1, hash2, TRUE);
1086 }
1087 
1088 /*
1089  * call-seq:
1090  * hsh.merge!(other_hash) -> hsh
1091  * hsh.update(other_hash) -> hsh
1092  * hsh.merge!(other_hash){|key, oldval, newval| block} -> hsh
1093  * hsh.update(other_hash){|key, oldval, newval| block} -> hsh
1094  *
1095  * Adds the contents of <i>other_hash</i> to <i>hsh</i>. If no
1096  * block is specified, entries with duplicate keys are overwritten
1097  * with the values from <i>other_hash</i>, otherwise the value
1098  * of each duplicate key is determined by calling the block with
1099  * the key, its value in <i>hsh</i> and its value in <i>other_hash</i>.
1100  *
1101  * h1 = { "a" => 100, "b" => 200 }
1102  * h2 = { "b" => 254, "c" => 300 }
1103  * h1.merge!(h2) #=> {"a"=>100, "b"=>254, "c"=>300}
1104  *
1105  * h1 = { "a" => 100, "b" => 200 }
1106  * h2 = { "b" => 254, "c" => 300 }
1107  * h1.merge!(h2) { |key, v1, v2| v1 }
1108  * #=> {"a"=>100, "b"=>200, "c"=>300}
1109  */
1110 
1111 /* 15.2.13.4.22 */
1112 /*
1113  * call-seq:
1114  * hsh.merge(other_hash) -> new_hash
1115  * hsh.merge(other_hash){|key, oldval, newval| block} -> new_hash
1116  *
1117  * Returns a new hash containing the contents of <i>other_hash</i> and
1118  * the contents of <i>hsh</i>. If no block is specified, the value for
1119  * entries with duplicate keys will be that of <i>other_hash</i>. Otherwise
1120  * the value for each duplicate key is determined by calling the block
1121  * with the key, its value in <i>hsh</i> and its value in <i>other_hash</i>.
1122  *
1123  * h1 = { "a" => 100, "b" => 200 }
1124  * h2 = { "b" => 254, "c" => 300 }
1125  * h1.merge(h2) #=> {"a"=>100, "b"=>254, "c"=>300}
1126  * h1.merge(h2){|key, oldval, newval| newval - oldval}
1127  * #=> {"a"=>100, "b"=>54, "c"=>300}
1128  * h1 #=> {"a"=>100, "b"=>200}
1129  *
1130  */
1131 
1132 /*
1133  * call-seq:
1134  * hash.assoc(obj) -> an_array or nil
1135  *
1136  * Searches through the hash comparing _obj_ with the key using <code>==</code>.
1137  * Returns the key-value pair (two elements array) or +nil+
1138  * if no match is found. See <code>Array#assoc</code>.
1139  *
1140  * h = {"colors" => ["red", "blue", "green"],
1141  * "letters" => ["a", "b", "c" ]}
1142  * h.assoc("letters") #=> ["letters", ["a", "b", "c"]]
1143  * h.assoc("foo") #=> nil
1144  */
1145 
1146 mrb_value
1147 mrb_hash_assoc(mrb_state *mrb, mrb_value hash)
1148 {
1149  mrb_value key, value, has_key;
1150 
1151  mrb_get_args(mrb, "o", &key);
1152  if (mrb_nil_p(key))
1153  mrb_raise(mrb, E_ARGUMENT_ERROR, "wrong number of arguments");
1154 
1155  has_key = mrb_hash_has_keyWithKey(mrb, hash, key);
1156  if (mrb_test(has_key)) {
1157  value = mrb_hash_get(mrb, hash, key);
1158  return mrb_assoc_new(mrb, key, value);
1159  }
1160  else {
1161  return mrb_nil_value();
1162  }
1163 }
1164 
1165 /*
1166  * call-seq:
1167  * hash.rassoc(key) -> an_array or nil
1168  *
1169  * Searches through the hash comparing _obj_ with the value using <code>==</code>.
1170  * Returns the first key-value pair (two-element array) that matches. See
1171  * also <code>Array#rassoc</code>.
1172  *
1173  * a = {1=> "one", 2 => "two", 3 => "three", "ii" => "two"}
1174  * a.rassoc("two") #=> [2, "two"]
1175  * a.rassoc("four") #=> nil
1176  */
1177 
1178 mrb_value
1179 mrb_hash_rassoc(mrb_state *mrb, mrb_value hash)
1180 {
1181  mrb_value key, value, has_key;
1182 
1183  mrb_get_args(mrb, "o", &key);
1184  has_key = mrb_hash_has_keyWithKey(mrb, hash, key);
1185  if (mrb_test(has_key)) {
1186  value = mrb_hash_get(mrb, hash, key);
1187  return mrb_assoc_new(mrb, value, key);
1188  }
1189  else {
1190  return mrb_nil_value();
1191  }
1192 }
1193 
1194 /*
1195  * call-seq:
1196  * hash.flatten -> an_array
1197  * hash.flatten(level) -> an_array
1198  *
1199  * Returns a new array that is a one-dimensional flattening of this
1200  * hash. That is, for every key or value that is an array, extract
1201  * its elements into the new array. Unlike Array#flatten, this
1202  * method does not flatten recursively by default. The optional
1203  * <i>level</i> argument determines the level of recursion to flatten.
1204  *
1205  * a = {1=> "one", 2 => [2,"two"], 3 => "three"}
1206  * a.flatten # => [1, "one", 2, [2, "two"], 3, "three"]
1207  * a.flatten(2) # => [1, "one", 2, 2, "two", 3, "three"]
1208  */
1209 
1210 /*
1211  * A <code>Hash</code> is a collection of key-value pairs. It is
1212  * similar to an <code>Array</code>, except that indexing is done via
1213  * arbitrary keys of any object type, not an integer index. Hashes enumerate
1214  * their values in the order that the corresponding keys were inserted.
1215  *
1216  * Hashes have a <em>default value</em> that is returned when accessing
1217  * keys that do not exist in the hash. By default, that value is
1218  * <code>nil</code>.
1219  *
1220  */
1221 
1222 void
1224 {
1225  struct RClass *h;
1226 
1227  h = mrb->hash_class = mrb_define_class(mrb, "Hash", mrb->object_class);
1229 
1230  mrb_include_module(mrb, h, mrb_class_get(mrb, "Enumerable"));
1231  mrb_define_method(mrb, h, "==", mrb_hash_equal, MRB_ARGS_REQ(1)); /* 15.2.13.4.1 */
1232  mrb_define_method(mrb, h, "[]", mrb_hash_aget, MRB_ARGS_REQ(1)); /* 15.2.13.4.2 */
1233  mrb_define_method(mrb, h, "[]=", mrb_hash_aset, MRB_ARGS_REQ(2)); /* 15.2.13.4.3 */
1234  mrb_define_method(mrb, h, "clear", mrb_hash_clear, MRB_ARGS_NONE()); /* 15.2.13.4.4 */
1235  mrb_define_method(mrb, h, "default", mrb_hash_default, MRB_ARGS_ANY()); /* 15.2.13.4.5 */
1236  mrb_define_method(mrb, h, "default=", mrb_hash_set_default, MRB_ARGS_REQ(1)); /* 15.2.13.4.6 */
1237  mrb_define_method(mrb, h, "default_proc", mrb_hash_default_proc,MRB_ARGS_NONE()); /* 15.2.13.4.7 */
1238  mrb_define_method(mrb, h, "default_proc=", mrb_hash_set_default_proc,MRB_ARGS_REQ(1)); /* 15.2.13.4.7 */
1239  mrb_define_method(mrb, h, "__delete", mrb_hash_delete, MRB_ARGS_REQ(1)); /* core of 15.2.13.4.8 */
1240  mrb_define_method(mrb, h, "empty?", mrb_hash_empty_p, MRB_ARGS_NONE()); /* 15.2.13.4.12 */
1241  mrb_define_method(mrb, h, "has_key?", mrb_hash_has_key, MRB_ARGS_REQ(1)); /* 15.2.13.4.13 */
1242  mrb_define_method(mrb, h, "has_value?", mrb_hash_has_value, MRB_ARGS_REQ(1)); /* 15.2.13.4.14 */
1243  mrb_define_method(mrb, h, "include?", mrb_hash_has_key, MRB_ARGS_REQ(1)); /* 15.2.13.4.15 */
1244  mrb_define_method(mrb, h, "__init_core", mrb_hash_init_core, MRB_ARGS_ANY()); /* core of 15.2.13.4.16 */
1245  mrb_define_method(mrb, h, "initialize_copy", mrb_hash_replace, MRB_ARGS_REQ(1)); /* 15.2.13.4.17 */
1246  mrb_define_method(mrb, h, "key?", mrb_hash_has_key, MRB_ARGS_REQ(1)); /* 15.2.13.4.18 */
1247  mrb_define_method(mrb, h, "keys", mrb_hash_keys, MRB_ARGS_NONE()); /* 15.2.13.4.19 */
1248  mrb_define_method(mrb, h, "length", mrb_hash_size_m, MRB_ARGS_NONE()); /* 15.2.13.4.20 */
1249  mrb_define_method(mrb, h, "member?", mrb_hash_has_key, MRB_ARGS_REQ(1)); /* 15.2.13.4.21 */
1250  mrb_define_method(mrb, h, "replace", mrb_hash_replace, MRB_ARGS_REQ(1)); /* 15.2.13.4.23 */
1251  mrb_define_method(mrb, h, "shift", mrb_hash_shift, MRB_ARGS_NONE()); /* 15.2.13.4.24 */
1252  mrb_define_method(mrb, h, "size", mrb_hash_size_m, MRB_ARGS_NONE()); /* 15.2.13.4.25 */
1253  mrb_define_method(mrb, h, "store", mrb_hash_aset, MRB_ARGS_REQ(2)); /* 15.2.13.4.26 */
1254  mrb_define_method(mrb, h, "value?", mrb_hash_has_value, MRB_ARGS_REQ(1)); /* 15.2.13.4.27 */
1255  mrb_define_method(mrb, h, "values", mrb_hash_values, MRB_ARGS_NONE()); /* 15.2.13.4.28 */
1256 
1257  mrb_define_method(mrb, h, "to_hash", mrb_hash_to_hash, MRB_ARGS_NONE()); /* 15.2.13.4.29 (x)*/
1258  mrb_define_method(mrb, h, "inspect", mrb_hash_inspect, MRB_ARGS_NONE()); /* 15.2.13.4.30 (x)*/
1259  mrb_define_alias(mrb, h, "to_s", "inspect"); /* 15.2.13.4.31 (x)*/
1260  mrb_define_method(mrb, h, "eql?", mrb_hash_eql, MRB_ARGS_REQ(1)); /* 15.2.13.4.32 (x)*/
1261 }