add Joe
[python.git] / Include / stringobject.h
blob18b5b411aca6943b2d0b560f9a1faeaaedba84b0
2 /* String (str/bytes) object interface */
4 #ifndef Py_STRINGOBJECT_H
5 #define Py_STRINGOBJECT_H
6 #ifdef __cplusplus
7 extern "C" {
8 #endif
10 #include <stdarg.h>
12 /*
13 Type PyStringObject represents a character string. An extra zero byte is
14 reserved at the end to ensure it is zero-terminated, but a size is
15 present so strings with null bytes in them can be represented. This
16 is an immutable object type.
18 There are functions to create new string objects, to test
19 an object for string-ness, and to get the
20 string value. The latter function returns a null pointer
21 if the object is not of the proper type.
22 There is a variant that takes an explicit size as well as a
23 variant that assumes a zero-terminated string. Note that none of the
24 functions should be applied to NULL pointers.
25 */
27 /* Caching the hash (ob_shash) saves recalculation of a string's hash value.
28 Interning strings (ob_sstate) tries to ensure that only one string
29 object with a given value exists, so equality tests can be one pointer
30 comparison. This is generally restricted to strings that "look like"
31 Python identifiers, although the intern() builtin can be used to force
32 interning of any string.
33 Together, these sped the interpreter by up to 20%. */
/* Object layout of a string (str/bytes) object; the invariants that tie the
   fields together are listed after them. */
35 typedef struct {
36 PyObject_VAR_HEAD
37 long ob_shash; /* cached hash of the string; -1 while not yet computed */
38 int ob_sstate; /* interning state; nonzero iff the object is in 'interned' */
39 char ob_sval[1]; /* string bytes; declared with one element but holds ob_size+1, the last being 0 */
41 /* Invariants:
42 * ob_sval contains space for 'ob_size+1' elements.
43 * ob_sval[ob_size] == 0.
44 * ob_shash is the hash of the string or -1 if not computed yet.
45 * ob_sstate != 0 iff the string object is in stringobject.c's
46 * 'interned' dictionary; in this case the two references
47 * from 'interned' to this object are *not counted* in ob_refcnt.
49 } PyStringObject;
/* Interning states, going by the SSTATE_ prefix the values kept in ob_sstate.
   0 is the only "not interned" value, which matches the invariant that
   ob_sstate != 0 iff the string is in the 'interned' dictionary. */
51 #define SSTATE_NOT_INTERNED 0
52 #define SSTATE_INTERNED_MORTAL 1 /* NOTE(review): presumably the state set by PyString_InternInPlace -- confirm in stringobject.c */
53 #define SSTATE_INTERNED_IMMORTAL 2 /* NOTE(review): presumably the state set by PyString_InternImmortal -- confirm in stringobject.c */
/* Type objects declared (not defined) by this header. PyString_Type is the
   type that PyString_CheckExact() compares an object's type against.
   NOTE(review): PyBaseString_Type is not used anywhere else in this header;
   confirm its role in stringobject.c. */
55 PyAPI_DATA(PyTypeObject) PyBaseString_Type;
56 PyAPI_DATA(PyTypeObject) PyString_Type;
/* Type tests for string objects.
   PyString_Check(op) hands op's type to PyType_FastSubclass() together with
   the Py_TPFLAGS_STRING_SUBCLASS flag.
   PyString_CheckExact(op) is true only when op's type is PyString_Type itself.
   Neither macro adds a NULL check of its own before applying Py_TYPE(op). */
58 #define PyString_Check(op) \
59 PyType_FastSubclass(Py_TYPE(op), Py_TPFLAGS_STRING_SUBCLASS)
60 #define PyString_CheckExact(op) (Py_TYPE(op) == &PyString_Type)
/* Constructors, accessors and formatting helpers for string objects.
   Parameter names are omitted in these prototypes, so the notes below only
   state what the signatures themselves show; anything else is hedged. */

/* Constructors. Presumably the "explicit size" and "zero-terminated" variants
   mentioned in the comment at the top of this header -- confirm. */
62 PyAPI_FUNC(PyObject *) PyString_FromStringAndSize(const char *, Py_ssize_t);
63 PyAPI_FUNC(PyObject *) PyString_FromString(const char *);
/* printf-style constructors. The GCC format attribute marks argument 1 as
   the format string. The va_list variant passes 0 because there are no
   variadic arguments for the compiler to check; the "..." variant has them
   checked starting at argument 2. */
64 PyAPI_FUNC(PyObject *) PyString_FromFormatV(const char*, va_list)
65 Py_GCC_ATTRIBUTE((format(printf, 1, 0)));
66 PyAPI_FUNC(PyObject *) PyString_FromFormat(const char*, ...)
67 Py_GCC_ATTRIBUTE((format(printf, 1, 2)));
/* Accessors taking a generic PyObject pointer. NOTE(review): PyString_AsString
   is presumably the "get the string value" function that the top-of-file
   comment says returns a null pointer for objects of the wrong type. */
68 PyAPI_FUNC(Py_ssize_t) PyString_Size(PyObject *);
69 PyAPI_FUNC(char *) PyString_AsString(PyObject *);
70 PyAPI_FUNC(PyObject *) PyString_Repr(PyObject *, int);
/* These three take the address of the caller's object pointer as their first
   argument (presumably so the pointer can be replaced -- confirm in
   stringobject.c). The Concat functions return void, so failure cannot be
   reported through a return value. */
71 PyAPI_FUNC(void) PyString_Concat(PyObject **, PyObject *);
72 PyAPI_FUNC(void) PyString_ConcatAndDel(PyObject **, PyObject *);
73 PyAPI_FUNC(int) _PyString_Resize(PyObject **, Py_ssize_t);
74 PyAPI_FUNC(int) _PyString_Eq(PyObject *, PyObject*);
75 PyAPI_FUNC(PyObject *) PyString_Format(PyObject *, PyObject *);
/* The char** and int* parameters are pointers to caller variables, i.e. they
   look like output parameters. NOTE(review): confirm their meaning, and that
   of the three ints, in stringobject.c. */
76 PyAPI_FUNC(PyObject *) _PyString_FormatLong(PyObject*, int, int,
77 int, char**, int*);
/* NOTE(review): five unnamed arguments (buffer/length pairs plus one more
   string); their roles are not visible from this header. */
78 PyAPI_FUNC(PyObject *) PyString_DecodeEscape(const char *, Py_ssize_t,
79 const char *, Py_ssize_t,
80 const char *);
/* Interning entry points (see the comment on ob_sstate and the 'interned'
   dictionary earlier in this header). The first two take the address of the
   caller's object pointer and return void; presumably the pointer is replaced
   by the interned object -- confirm in stringobject.c.
   PyString_InternFromString takes a C string and returns an object.
   NOTE(review): _Py_ReleaseInternedStrings takes no arguments; its exact
   effect is not visible from this header. */
82 PyAPI_FUNC(void) PyString_InternInPlace(PyObject **);
83 PyAPI_FUNC(void) PyString_InternImmortal(PyObject **);
84 PyAPI_FUNC(PyObject *) PyString_InternFromString(const char *);
85 PyAPI_FUNC(void) _Py_ReleaseInternedStrings(void);
87 /* Use only if you know it's a string: op is cast to PyStringObject *
   without any type check. The macro evaluates to the object's ob_sstate
   field, which is nonzero iff the string is interned. */
88 #define PyString_CHECK_INTERNED(op) (((PyStringObject *)(op))->ob_sstate)
90 /* Macros, trading safety for speed: neither one checks the type of op.
   PyString_AS_STRING(op) casts op to PyStringObject * and yields its
   ob_sval array; PyString_GET_SIZE(op) is simply Py_SIZE(op). */
91 #define PyString_AS_STRING(op) (((PyStringObject *)(op))->ob_sval)
92 #define PyString_GET_SIZE(op) Py_SIZE(op)
94 /* _PyString_Join(sep, x) is like sep.join(x). sep must be PyStringObject*,
95 x must be an iterable object. Both parameters are declared as plain
   PyObject pointers, so the compiler does not enforce either requirement;
   the result is returned as a PyObject pointer. */
96 PyAPI_FUNC(PyObject *) _PyString_Join(PyObject *sep, PyObject *x);
98 /* --- Generic Codecs ----------------------------------------------------- */
100 /* Create an object by decoding the encoded string s of the
101 given size. */
103 PyAPI_FUNC(PyObject*) PyString_Decode(
104 const char *s, /* encoded string */
105 Py_ssize_t size, /* size of buffer */
106 const char *encoding, /* encoding */
107 const char *errors /* error handling */
110 /* Encodes a char buffer of the given size and returns a
111 Python object. */
113 PyAPI_FUNC(PyObject*) PyString_Encode(
114 const char *s, /* string char buffer */
115 Py_ssize_t size, /* number of chars to encode */
116 const char *encoding, /* encoding */
117 const char *errors /* error handling */
120 /* Encodes a string object and returns the result as a Python
121 object. */
123 PyAPI_FUNC(PyObject*) PyString_AsEncodedObject(
124 PyObject *str, /* string object */
125 const char *encoding, /* encoding */
126 const char *errors /* error handling */
129 /* Encodes a string object and returns the result as a Python string
130 object.
132 If the codec returns a Unicode object, the object is converted
133 back to a string using the default encoding.
135 DEPRECATED - use PyString_AsEncodedObject() instead. */
137 PyAPI_FUNC(PyObject*) PyString_AsEncodedString(
138 PyObject *str, /* string object */
139 const char *encoding, /* encoding */
140 const char *errors /* error handling */
143 /* Decodes a string object and returns the result as a Python
144 object. */
146 PyAPI_FUNC(PyObject*) PyString_AsDecodedObject(
147 PyObject *str, /* string object */
148 const char *encoding, /* encoding */
149 const char *errors /* error handling */
152 /* Decodes a string object and returns the result as a Python string
153 object.
155 If the codec returns a Unicode object, the object is converted
156 back to a string using the default encoding.
158 DEPRECATED - use PyString_AsDecodedObject() instead. */
160 PyAPI_FUNC(PyObject*) PyString_AsDecodedString(
161 PyObject *str, /* string object */
162 const char *encoding, /* encoding */
163 const char *errors /* error handling */
166 /* Provides access to the internal data buffer and size of a string
167 object or the default encoded version of a Unicode object. Passing
168 NULL as the len parameter will force the string buffer to be
169 0-terminated (passing a string with embedded null characters will
170 cause an exception). */
172 PyAPI_FUNC(int) PyString_AsStringAndSize(
173 register PyObject *obj, /* string or Unicode object */
174 register char **s, /* pointer to buffer variable */
175 register Py_ssize_t *len /* pointer to length variable or NULL
176 (only possible for 0-terminated
177 strings) */
181 /* Using the current locale, insert the thousands grouping
182 into the string pointed to by buffer. For the argument descriptions,
183 see Objects/stringlib/localeutil.h
   Unlike _PyString_InsertThousandsGrouping, this variant takes no grouping
   or separator arguments. Both buffer and digits are non-const char
   pointers. NOTE(review): the meaning of the Py_ssize_t return value is not
   stated here; check localeutil.h. */
184 PyAPI_FUNC(Py_ssize_t) _PyString_InsertThousandsGroupingLocale(char *buffer,
185 Py_ssize_t n_buffer,
186 char *digits,
187 Py_ssize_t n_digits,
188 Py_ssize_t min_width);
190 /* Using explicit passed-in values, insert the thousands grouping
191 into the string pointed to by buffer. For the argument descriptions,
192 see Objects/stringlib/localeutil.h
   The explicit values are the two trailing const strings, grouping and
   thousands_sep; the first five parameters match the Locale variant.
   NOTE(review): the meaning of the Py_ssize_t return value is not stated
   here; check localeutil.h. */
193 PyAPI_FUNC(Py_ssize_t) _PyString_InsertThousandsGrouping(char *buffer,
194 Py_ssize_t n_buffer,
195 char *digits,
196 Py_ssize_t n_digits,
197 Py_ssize_t min_width,
198 const char *grouping,
199 const char *thousands_sep);
201 /* Format the object based on the format_spec, as defined in PEP 3101
202 (Advanced String Formatting).
   format_spec is passed together with an explicit length (format_spec_len)
   and is a non-const char pointer.
   NOTE(review): this is the only declaration in this header that uses the
   _PyBytes_ prefix rather than PyString_/_PyString_ -- confirm whether the
   name is remapped elsewhere. */
203 PyAPI_FUNC(PyObject *) _PyBytes_FormatAdvanced(PyObject *obj,
204 char *format_spec,
205 Py_ssize_t format_spec_len);
207 #ifdef __cplusplus
209 #endif
210 #endif /* !Py_STRINGOBJECT_H */