• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
/* GLIB - Library of useful routines for C programming
 * Copyright (C) 1995-1997  Peter Mattis, Spencer Kimball and Josh MacDonald
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */
17 
/*
 * Modified by the GLib Team and others 1997-2000.  See the AUTHORS
 * file for a list of people on the GLib Team.  See the ChangeLog
 * files for a list of changes.  These files are distributed with
 * GLib at ftp://ftp.gtk.org/pub/gtk/.
 */
24 
/*
 * MT safe
 */
28 
29 #include "config.h"
30 
31 #include <string.h>
32 
33 #include "gstringchunk.h"
34 
35 #include "ghash.h"
36 #include "gslist.h"
37 #include "gmessages.h"
38 
39 #include "gutils.h"
40 
/**
 * SECTION:string_chunks
 * @title: String Chunks
 * @short_description: efficient storage of groups of strings
 *
 * String chunks are used to store groups of strings. Memory is
 * allocated in blocks, and as strings are added to the #GStringChunk
 * they are copied into the next free position in a block. When a block
 * is full, a new block is allocated.
 *
 * When storing a large number of strings, string chunks are more
 * efficient than using g_strdup() since fewer calls to malloc() are
 * needed, and less memory is wasted in memory allocation overhead.
 *
 * By adding strings with g_string_chunk_insert_const() it is also
 * possible to remove duplicates.
 *
 * To create a new #GStringChunk use g_string_chunk_new().
 *
 * To add strings to a #GStringChunk use g_string_chunk_insert().
 *
 * To add strings to a #GStringChunk, but without duplicating strings
 * which are already in the #GStringChunk, use
 * g_string_chunk_insert_const().
 *
 * To free the entire #GStringChunk use g_string_chunk_free(). It is
 * not possible to free individual strings.
 */
69 
70 /**
71  * GStringChunk:
72  *
73  * An opaque data structure representing String Chunks.
74  * It should only be accessed by using the following functions.
75  */
76 struct _GStringChunk
77 {
78   GHashTable *const_table;
79   GSList     *storage_list;
80   gsize       storage_next;
81   gsize       this_size;
82   gsize       default_size;
83 };
84 
85 #define MY_MAXSIZE ((gsize)-1)
86 
87 static inline gsize
nearest_power(gsize base,gsize num)88 nearest_power (gsize base,
89                gsize num)
90 {
91   if (num > MY_MAXSIZE / 2)
92     {
93       return MY_MAXSIZE;
94     }
95   else
96     {
97       gsize n = base;
98 
99       while (n < num)
100         n <<= 1;
101 
102       return n;
103     }
104 }
105 
106 /**
107  * g_string_chunk_new:
108  * @size: the default size of the blocks of memory which are
109  *     allocated to store the strings. If a particular string
110  *     is larger than this default size, a larger block of
111  *     memory will be allocated for it.
112  *
113  * Creates a new #GStringChunk.
114  *
115  * Returns: a new #GStringChunk
116  */
117 GStringChunk *
g_string_chunk_new(gsize size)118 g_string_chunk_new (gsize size)
119 {
120   GStringChunk *new_chunk = g_new (GStringChunk, 1);
121   gsize actual_size = 1;
122 
123   actual_size = nearest_power (1, size);
124 
125   new_chunk->const_table  = NULL;
126   new_chunk->storage_list = NULL;
127   new_chunk->storage_next = actual_size;
128   new_chunk->default_size = actual_size;
129   new_chunk->this_size    = actual_size;
130 
131   return new_chunk;
132 }
133 
134 /**
135  * g_string_chunk_free:
136  * @chunk: a #GStringChunk
137  *
138  * Frees all memory allocated by the #GStringChunk.
139  * After calling g_string_chunk_free() it is not safe to
140  * access any of the strings which were contained within it.
141  */
142 void
g_string_chunk_free(GStringChunk * chunk)143 g_string_chunk_free (GStringChunk *chunk)
144 {
145   g_return_if_fail (chunk != NULL);
146 
147   if (chunk->storage_list)
148     g_slist_free_full (chunk->storage_list, g_free);
149 
150   if (chunk->const_table)
151     g_hash_table_destroy (chunk->const_table);
152 
153   g_free (chunk);
154 }
155 
156 /**
157  * g_string_chunk_clear:
158  * @chunk: a #GStringChunk
159  *
160  * Frees all strings contained within the #GStringChunk.
161  * After calling g_string_chunk_clear() it is not safe to
162  * access any of the strings which were contained within it.
163  *
164  * Since: 2.14
165  */
166 void
g_string_chunk_clear(GStringChunk * chunk)167 g_string_chunk_clear (GStringChunk *chunk)
168 {
169   g_return_if_fail (chunk != NULL);
170 
171   if (chunk->storage_list)
172     {
173       g_slist_free_full (chunk->storage_list, g_free);
174 
175       chunk->storage_list = NULL;
176       chunk->storage_next = chunk->default_size;
177       chunk->this_size    = chunk->default_size;
178     }
179 
180   if (chunk->const_table)
181       g_hash_table_remove_all (chunk->const_table);
182 }
183 
184 /**
185  * g_string_chunk_insert:
186  * @chunk: a #GStringChunk
187  * @string: the string to add
188  *
189  * Adds a copy of @string to the #GStringChunk.
190  * It returns a pointer to the new copy of the string
191  * in the #GStringChunk. The characters in the string
192  * can be changed, if necessary, though you should not
193  * change anything after the end of the string.
194  *
195  * Unlike g_string_chunk_insert_const(), this function
196  * does not check for duplicates. Also strings added
197  * with g_string_chunk_insert() will not be searched
198  * by g_string_chunk_insert_const() when looking for
199  * duplicates.
200  *
201  * Returns: a pointer to the copy of @string within
202  *     the #GStringChunk
203  */
204 gchar*
g_string_chunk_insert(GStringChunk * chunk,const gchar * string)205 g_string_chunk_insert (GStringChunk *chunk,
206                        const gchar  *string)
207 {
208   g_return_val_if_fail (chunk != NULL, NULL);
209 
210   return g_string_chunk_insert_len (chunk, string, -1);
211 }
212 
213 /**
214  * g_string_chunk_insert_const:
215  * @chunk: a #GStringChunk
216  * @string: the string to add
217  *
218  * Adds a copy of @string to the #GStringChunk, unless the same
219  * string has already been added to the #GStringChunk with
220  * g_string_chunk_insert_const().
221  *
222  * This function is useful if you need to copy a large number
223  * of strings but do not want to waste space storing duplicates.
224  * But you must remember that there may be several pointers to
225  * the same string, and so any changes made to the strings
226  * should be done very carefully.
227  *
228  * Note that g_string_chunk_insert_const() will not return a
229  * pointer to a string added with g_string_chunk_insert(), even
230  * if they do match.
231  *
232  * Returns: a pointer to the new or existing copy of @string
233  *     within the #GStringChunk
234  */
235 gchar*
g_string_chunk_insert_const(GStringChunk * chunk,const gchar * string)236 g_string_chunk_insert_const (GStringChunk *chunk,
237                              const gchar  *string)
238 {
239   char* lookup;
240 
241   g_return_val_if_fail (chunk != NULL, NULL);
242 
243   if (!chunk->const_table)
244     chunk->const_table = g_hash_table_new (g_str_hash, g_str_equal);
245 
246   lookup = (char*) g_hash_table_lookup (chunk->const_table, (gchar *)string);
247 
248   if (!lookup)
249     {
250       lookup = g_string_chunk_insert (chunk, string);
251       g_hash_table_add (chunk->const_table, lookup);
252     }
253 
254   return lookup;
255 }
256 
257 /**
258  * g_string_chunk_insert_len:
259  * @chunk: a #GStringChunk
260  * @string: bytes to insert
261  * @len: number of bytes of @string to insert, or -1 to insert a
262  *     nul-terminated string
263  *
264  * Adds a copy of the first @len bytes of @string to the #GStringChunk.
265  * The copy is nul-terminated.
266  *
267  * Since this function does not stop at nul bytes, it is the caller's
268  * responsibility to ensure that @string has at least @len addressable
269  * bytes.
270  *
271  * The characters in the returned string can be changed, if necessary,
272  * though you should not change anything after the end of the string.
273  *
274  * Returns: a pointer to the copy of @string within the #GStringChunk
275  *
276  * Since: 2.4
277  */
278 gchar*
g_string_chunk_insert_len(GStringChunk * chunk,const gchar * string,gssize len)279 g_string_chunk_insert_len (GStringChunk *chunk,
280                            const gchar  *string,
281                            gssize        len)
282 {
283   gssize size;
284   gchar* pos;
285 
286   g_return_val_if_fail (chunk != NULL, NULL);
287 
288   if (len < 0)
289     size = strlen (string);
290   else
291     size = len;
292 
293   if ((chunk->storage_next + size + 1) > chunk->this_size)
294     {
295       gsize new_size = nearest_power (chunk->default_size, size + 1);
296 
297       chunk->storage_list = g_slist_prepend (chunk->storage_list,
298                                              g_new (gchar, new_size));
299 
300       chunk->this_size = new_size;
301       chunk->storage_next = 0;
302     }
303 
304   pos = ((gchar *) chunk->storage_list->data) + chunk->storage_next;
305 
306   *(pos + size) = '\0';
307 
308   memcpy (pos, string, size);
309 
310   chunk->storage_next += size + 1;
311 
312   return pos;
313 }
314