1 | /* The size of the shared strings hashtable. This must be smaller than |
1 | #ifndef SHSTR_H__ |
2 | * 32767; the current value of 4133 ought to be plenty. |
2 | #define SHSTR_H__ |
3 | */ |
|
|
4 | #define TABLESIZE 4133 |
|
|
5 | |
3 | |
6 | /* This specifies how many characters the hashing routine should look at. |
4 | #include <sstream> |
7 | * You may actually save CPU by increasing this number if the typical string |
5 | |
8 | * is large. |
6 | #include "util.h" |
9 | */ |
7 | |
10 | #ifndef MAXSTRING |
8 | extern int buf_overflow (const char *buf1, const char *buf2, int bufsize); |
11 | #define MAXSTRING 20 |
9 | |
|
|
10 | struct shstr |
|
|
11 | { |
|
|
12 | static const char *null; |
|
|
13 | |
|
|
14 | const char *s; |
|
|
15 | |
|
|
16 | static int &refcnt (const char *s) |
|
|
17 | { |
|
|
18 | return *((int *)s - 1); |
|
|
19 | } |
|
|
20 | |
|
|
21 | static int &length (const char *s) |
|
|
22 | { |
|
|
23 | return *((int *)s - 2); |
|
|
24 | } |
|
|
25 | |
|
|
26 | int &refcnt () const |
|
|
27 | { |
|
|
28 | return refcnt (s); |
|
|
29 | } |
|
|
30 | |
|
|
31 | int length () const |
|
|
32 | { |
|
|
33 | return length (s); |
|
|
34 | } |
|
|
35 | |
|
|
36 | static const char *find (const char *s); |
|
|
37 | static const char *intern (const char *s); |
|
|
38 | |
|
|
39 | static void gc (); // garbage collect a few strings |
|
|
40 | |
|
|
41 | // this is used for informational messages and the like |
|
|
42 | const char *operator &() const { return s; } |
|
|
43 | |
|
|
44 | const char &operator [](int i) const { return s[i]; } |
|
|
45 | operator const char *() const { return s == null ? 0 : s; } |
|
|
46 | |
|
|
47 | shstr () |
|
|
48 | : s (null) |
|
|
49 | { |
|
|
50 | } |
|
|
51 | |
|
|
52 | shstr (const shstr &sh) |
|
|
53 | : s (sh.s) |
|
|
54 | { |
|
|
55 | ++refcnt (); |
|
|
56 | } |
|
|
57 | |
|
|
58 | explicit shstr (const char *s) |
|
|
59 | : s (intern (s)) |
|
|
60 | { |
|
|
61 | } |
|
|
62 | |
|
|
63 | ~shstr () |
|
|
64 | { |
|
|
65 | --refcnt (); |
|
|
66 | } |
|
|
67 | |
|
|
68 | const shstr &operator =(const shstr &sh) |
|
|
69 | { |
|
|
70 | --refcnt (); |
|
|
71 | s = sh.s; |
|
|
72 | ++refcnt (); |
|
|
73 | |
|
|
74 | return *this; |
|
|
75 | } |
|
|
76 | |
|
|
77 | const shstr &operator =(const char *str) |
|
|
78 | { |
|
|
79 | --refcnt (); |
|
|
80 | |
|
|
81 | // this optimises the important case of str == constant 0 |
|
|
82 | if (is_constant (str)) |
|
|
83 | s = str ? intern (str) : null; |
|
|
84 | else |
|
|
85 | s = intern (str); |
|
|
86 | |
|
|
87 | return *this; |
|
|
88 | } |
|
|
89 | |
|
|
90 | bool operator ==(const shstr &b) |
|
|
91 | { |
|
|
92 | return s == b.s; |
|
|
93 | } |
|
|
94 | |
|
|
95 | bool operator !=(const shstr &b) |
|
|
96 | { |
|
|
97 | return !(*this == b); |
|
|
98 | } |
|
|
99 | }; |
|
|
100 | |
|
|
101 | inline int strlen (const shstr &sh) |
|
|
102 | { |
|
|
103 | return sh.length (); |
|
|
104 | } |
|
|
105 | |
|
|
106 | inline int strcmp (const shstr &a, const shstr &b) |
|
|
107 | { |
|
|
108 | // TODO: use this to find all the occurences of people using strcmp |
|
|
109 | // all uses should be bogus, as we should be never interested in |
|
|
110 | // comparing shstr's alphabetically |
|
|
111 | #if 0 |
|
|
112 | extern void do_not_use_strcmp_to_compare_shstr_values (); |
|
|
113 | do_not_use_strcmp_to_compare_shstr_values (); |
|
|
114 | #endif |
|
|
115 | return a != b; |
|
|
116 | } |
|
|
117 | |
|
|
118 | static std::ostream &operator <<(std::ostream &o, const shstr &sh) |
|
|
119 | { |
|
|
120 | o.write (sh.s, sh.length ()); |
|
|
121 | return o; |
|
|
122 | } |
|
|
123 | |
|
|
124 | // only good for mass comparisons to shstr objects |
|
|
125 | struct shstr_cmp |
|
|
126 | { |
|
|
127 | const char *s; |
|
|
128 | |
|
|
129 | explicit shstr_cmp (const char *s) |
|
|
130 | : s (shstr::find (s)) |
|
|
131 | { |
|
|
132 | } |
|
|
133 | |
|
|
134 | shstr_cmp (const shstr_cmp &sh) |
|
|
135 | : s (sh.s) |
|
|
136 | { |
|
|
137 | } |
|
|
138 | |
|
|
139 | shstr_cmp &operator =(const shstr_cmp sh) { s = sh.s; return *this; } |
|
|
140 | operator const char *() const { return s; } |
|
|
141 | }; |
|
|
142 | |
|
|
143 | inline bool operator ==(const shstr_cmp &a, const shstr &b) |
|
|
144 | { |
|
|
145 | return a.s == b.s; |
|
|
146 | } |
|
|
147 | |
|
|
148 | inline bool operator ==(const shstr &a, const shstr_cmp &b) |
|
|
149 | { |
|
|
150 | return b == a; |
|
|
151 | } |
|
|
152 | |
|
|
153 | extern const shstr undead_name; /* Used in hit_player() in main.c */ |
|
|
154 | |
12 | #endif |
155 | #endif |
13 | |
156 | |
/* Integer type used (in its unsigned form) for the reference counter of a
 * shared string. In the unlikely occurrence that 16383 references to a
 * string are too few, you can modify the below type to something bigger.
 * (The top bit of "refcount" is used to signify that "u.array" points
 * at the array entry, so one bit of the type is not available for counting.)
 * NOTE(review): 16383 looks like the limit for a 16-bit type with the top
 * bit reserved; with "int" the real limit is presumably larger - confirm.
 */
#define REFCOUNT_TYPE int
|
|
20 | |
|
|
/* The offsetof macro is part of ANSI C (<stddef.h>), but many compilers
 * lack it, for example "gcc -ansi". This fallback is only used when no
 * offsetof is defined yet.
 *
 * It yields the byte offset of "member" inside "type" as an int. The
 * offset is computed as a difference of char pointers, which avoids
 * casting a pointer straight to a narrower integer, and the whole expansion
 * is parenthesised so that it can be used inside larger expressions.
 */
#if !defined (offsetof)
#define offsetof(type, member) \
    ((int) ((char *) &(((type *) 0)->member) - (char *) 0))
#endif
|
|
27 | |
|
|
/* SS(string) will return the address of the shared_string struct which
 * contains "string".
 *
 * It steps back from x by the byte offset of the "string" member and casts
 * the result to shared_string *. x must therefore be a char pointer to the
 * "string" member of a shared_string; any other pointer gives a bogus
 * result.
 */
#define SS(x) ((shared_string *) ((x) - offsetof(shared_string, string)))
|
|
32 | |
|
|
/* Compile-time switch: when defined, the counters below exist and GATHER()
 * increments them; when undefined, GATHER() expands to nothing.
 */
#define SS_STATISTICS

/* Flag values for dump requests.
 * NOTE(review): presumably combined as bits by the dump routine - confirm.
 */
#define SS_DUMP_TABLE   1
#define SS_DUMP_TOTALS  2

#ifdef SS_STATISTICS
/* One set of counters per operation (add, add_ref, free, find, hash). */
static struct statistics {
    int calls;
    int hashed;
    int strcmps;
    int search;
    int linked;
} add_stats, add_ref_stats, free_stats, find_stats, hash_stats;

/* Increment the counter n. The argument is parenthesised so that any
 * lvalue expression can be passed safely.
 */
#define GATHER(n) (++(n))
#else /* !SS_STATISTICS */
#define GATHER(n)
#endif /* SS_STATISTICS */
|
|
50 | |
|
|
/* Mask with only the most significant bit of "unsigned REFCOUNT_TYPE" set.
 * Relies on CHAR_BIT, so <limits.h> must be in scope wherever this macro is
 * expanded.
 */
#define TOPBIT ((unsigned REFCOUNT_TYPE) 1 << (sizeof(REFCOUNT_TYPE) * CHAR_BIT - 1))
|
|
52 | |
|
|
/* Declared size of the "string" member of shared_string: the number of
 * bytes left over after the reference counter up to a sizeof(long)
 * boundary, plus one.
 *
 * The whole expansion is parenthesised so that expressions such as
 * "sizeof(shared_string) - PADDING" or "2 * PADDING" group as expected
 * rather than splitting off the trailing "+ 1".
 */
#define PADDING (((2 * sizeof(long) - sizeof(REFCOUNT_TYPE)) % sizeof(long)) + 1)
|
|
54 | |
|
|
/* One stored string together with its bookkeeping. The characters start at
 * the "string" member; SS() maps a pointer to them back to this struct.
 */
typedef struct _shared_string {
    /* Back link. Which member is valid is signalled by the top bit of
     * "refcount": when set, "array" points at the array entry, otherwise
     * (presumably) "previous" points at the preceding entry - confirm
     * against the implementation.
     */
    union {
        struct _shared_string **array;
        struct _shared_string *previous;
    } u;
    /* Forward link to another shared_string. */
    struct _shared_string *next;
    /* The top bit of "refcount" is used to signify that "u.array" points
     * at the array entry.
     */
    unsigned REFCOUNT_TYPE refcount;
    /* Padding will be unused memory, since we can't know how large
     * the padding is when allocating memory. We assume here that
     * sizeof(long) is a good boundary.
     */
    char string[PADDING];
} shared_string;
|
|