forked from shlomif/perl-XML-LibXML
-
Notifications
You must be signed in to change notification settings - Fork 0
/
perl-libxml-mm.h
372 lines (314 loc) · 10.6 KB
/
perl-libxml-mm.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
/**
* perl-libxml-mm.h
* $Id$
*
* Basic concept:
* perl varies in the implementation of UTF8 handling. this header (together
* with the c source) implements a few functions, that can be used from within
* the core module in order to avoid cascades of c pragmas
*/
#ifndef __PERL_LIBXML_MM_H__
#define __PERL_LIBXML_MM_H__
#ifdef __cplusplus
extern "C" {
#endif
#include "EXTERN.h"
#include "perl.h"
#include <libxml/parser.h>
#ifdef __cplusplus
}
#endif
/*
* NAME xs_warn
* TYPE MACRO
*
* this makro is for XML::LibXML development and debugging.
*
* SYNOPSIS
* xs_warn("my warning")
*
* this makro takes only a single string(!) and passes it to perls
* warn function if the XS_WARNRINGS pragma is used at compile time
* otherwise any xs_warn call is ignored.
*
* pay attention, that xs_warn does not implement a complete wrapper
* for warn!!
*/
#ifdef XS_WARNINGS
#define xs_warn(string) warn("%s",string)
#else
#define xs_warn(string)
#endif
/*
* @node: Reference to the node the structure proxies
* @owner: libxml defines only the document, but not the node owner
* (in case of document fragments, they are not the same!)
* @count: this is the internal reference count!
* @encoding: this value is missing in libxml2's doc structure
*
* Since XML::LibXML will not know, is a certain node is already
* defined in the perl layer, it can't surely tell when a node can be
* safely be removed from the memory. This structure helps to keep
* track how intense the nodes of a document are used and will not
* delete the nodes unless they are not referred from somewhere else.
*/
struct _ProxyNode {
xmlNodePtr node;
xmlNodePtr owner;
int count;
};
struct _DocProxyNode {
xmlNodePtr node;
xmlNodePtr owner;
int count;
int encoding; /* only used for proxies of xmlDocPtr */
int psvi_status; /* see below ... */
};
/* the psvi_status flag requires some explanation:
each time libxml2 validates a document (using DTD, Schema or
RelaxNG) it stores a pointer to a last successfully applied grammar
rule in node->psvi. Upon next validation, if libxml2 wants to check
that node matches some grammar rule, it first compares the rule
pointer and node->psvi. If these are equal, the validation of the
node's subtree is skipped and the node is assumed to match the
rule.
This causes problems when the tree is modified and then
re-validated or when the schema is freed and the document is
revalidated using a different schema and by bad chance a rule
tested against some node got allocated to the exact same location
as the rule from the schema used for the prior validation, already
freed, but still pointed to by node->psvi).
Thus, the node->psvi values can't be trusted at all and we want to
make sure all psvi slots are NULL before each validation. To aviod
traversing the tree in the most common case, when each document is
validated just once, we maintain the psvi_status flag.
Validating a document triggers this flag (sets it to 1). The
document with psvi_status==1 is traversed and psvi slots are nulled
prior to any validation. When the flag is triggered, it remains
triggered for the rest of the document's life, there is no way to
null it (even nulling up the psvi's does not null the flag, because
there may be unlinked parts of the document floating around which
we don't know about and thus cannot null their psvi pointers; these
unlinked document parts would cause inconsistency when re-attached
to the document tree).
Also, importing a node from a document with psvi_status==1 to a
document with psvi_status==0 automatically triggers psvi_status on
the target document.
NOTE: We could alternatively just null psvis from any imported
subtrees, but that would add an O(n) cleanup operation (n the size
of the imported subtree) on every importNode (possibly needlessly
since the target document may not ever be revalidated) whereas
triggering the flag is O(1) and possibly adds one O(N) cleanup
operation (N the size of the document) to the first validation of
the target document (any subsequent re-validation of the document
would have to perform the operation anyway). The sum of all n's may
be less then N, but OTH, there is a great chance that the O(N)
cleanup will never be performed. (BTW, validation is at least
O(N), probably O(Nlog N) anyway, so the cleanup has little impact;
similarly, importNode does xmlSetTreeDoc which is also O(n). So in
fact, neither solution should have significant performance impact
overall....).
*/
#define Pmm_NO_PSVI 0
#define Pmm_PSVI_TAINTED 1
/* helper type for the proxy structure */
typedef struct _DocProxyNode DocProxyNode;
typedef struct _ProxyNode ProxyNode;
/* pointer to the proxy structure */
typedef ProxyNode* ProxyNodePtr;
typedef DocProxyNode* DocProxyNodePtr;
/* this my go only into the header used by the xs */
#define SvPROXYNODE(x) (INT2PTR(ProxyNodePtr,SvIV(SvRV(x))))
#define PmmPROXYNODE(x) (INT2PTR(ProxyNodePtr,x->_private))
#define SvNAMESPACE(x) (INT2PTR(xmlNsPtr,SvIV(SvRV(x))))
#define PmmREFCNT(node) node->count
#define PmmREFCNT_inc(node) node->count++
#define PmmNODE(xnode) xnode->node
#define PmmOWNER(node) node->owner
#define PmmOWNERPO(node) ((node && PmmOWNER(node)) ? (ProxyNodePtr)PmmOWNER(node)->_private : node)
#define PmmENCODING(node) ((DocProxyNodePtr)(node))->encoding
#define PmmNodeEncoding(node) ((DocProxyNodePtr)(node->_private))->encoding
#define SetPmmENCODING(node,code) PmmENCODING(node)=(code)
#define SetPmmNodeEncoding(node,code) PmmNodeEncoding(node)=(code)
#define PmmInvalidatePSVI(doc) if (doc && doc->_private) ((DocProxyNodePtr)(doc->_private))->psvi_status = Pmm_PSVI_TAINTED;
#define PmmIsPSVITainted(doc) (doc && doc->_private && (((DocProxyNodePtr)(doc->_private))->psvi_status == Pmm_PSVI_TAINTED))
#define PmmClearPSVI(node) if (node && node->doc && node->doc->_private && \
((DocProxyNodePtr)(node->doc->_private))->psvi_status == Pmm_PSVI_TAINTED) \
domClearPSVI((xmlNodePtr) node)
#ifndef NO_XML_LIBXML_THREADS
#ifdef USE_ITHREADS
#define XML_LIBXML_THREADS
#endif
#endif
#ifdef XML_LIBXML_THREADS
/* structure for storing thread-local refcount */
struct _LocalProxyNode {
ProxyNodePtr proxy;
int count;
};
typedef struct _LocalProxyNode LocalProxyNode;
typedef LocalProxyNode* LocalProxyNodePtr;
#define PmmUSEREGISTRY (PROXY_NODE_REGISTRY_MUTEX != NULL)
#define PmmREGISTRY (INT2PTR(xmlHashTablePtr,SvIV(SvRV(get_sv("XML::LibXML::__PROXY_NODE_REGISTRY",0)))))
/* #define PmmREGISTRY (INT2PTR(xmlHashTablePtr,SvIV(SvRV(PROXY_NODE_REGISTRY)))) */
void
PmmCloneProxyNodes();
int
PmmProxyNodeRegistrySize();
void
PmmDumpRegistry(xmlHashTablePtr r);
void
PmmRegistryREFCNT_dec(ProxyNodePtr proxy);
#endif
void
PmmFreeHashTable(xmlHashTablePtr table);
ProxyNodePtr
PmmNewNode(xmlNodePtr node);
ProxyNodePtr
PmmNewFragment(xmlDocPtr document);
SV*
PmmCreateDocNode( unsigned int type, ProxyNodePtr pdoc, ...);
int
PmmREFCNT_dec( ProxyNodePtr node );
SV*
PmmNodeToSv( xmlNodePtr node, ProxyNodePtr owner );
/* PmmFixProxyEncoding
* TYPE
* Method
* PARAMETER
* @dfProxy: The proxystructure to fix.
*
* DESCRIPTION
*
* This little helper allows to fix the proxied encoding information
* after a not standard operation was done. This is required for
* XML::LibXSLT
*/
void
PmmFixProxyEncoding( ProxyNodePtr dfProxy );
/* PmmSvNodeExt
* TYPE
* Function
* PARAMETER
* @perlnode: the perl reference that holds the scalar.
* @copy : copy flag
*
* DESCRIPTION
*
* The function recognizes XML::LibXML and XML::GDOME
* nodes as valid input data. The second parameter 'copy'
* indicates if in case of GDOME nodes the libxml2 node
* should be copied. In some cases, where the node is
* cloned anyways, this flag has to be set to '0', while
* the default value should be allways '1'.
*/
xmlNodePtr
PmmSvNodeExt( SV * perlnode, int copy );
/* PmmSvNode
* TYPE
* Macro
* PARAMETER
* @perlnode: a perl reference that holds a libxml node
*
* DESCRIPTION
*
* PmmSvNode fetches the libxml node such as PmmSvNodeExt does. It is
* a wrapper, that sets the copy always to 1, which is good for all
* cases XML::LibXML uses.
*/
#define PmmSvNode(n) PmmSvNodeExt(n,1)
xmlNodePtr
PmmSvOwner( SV * perlnode );
SV*
PmmSetSvOwner(SV * perlnode, SV * owner );
int
PmmFixOwner(ProxyNodePtr node, ProxyNodePtr newOwner );
void
PmmFixOwnerNode(xmlNodePtr node, ProxyNodePtr newOwner );
int
PmmContextREFCNT_dec( ProxyNodePtr node );
SV*
PmmContextSv( xmlParserCtxtPtr ctxt );
xmlParserCtxtPtr
PmmSvContext( SV * perlctxt );
/**
* NAME PmmCopyNode
* TYPE function
*
* returns libxml2 node
*
* DESCRIPTION
* This function implements a nodetype independent node cloning.
*
* Note that this function has to stay in this module, since
* XML::LibXSLT reuses it.
*/
xmlNodePtr
PmmCloneNode( xmlNodePtr node , int deep );
/**
* NAME PmmNodeToGdomeSv
* TYPE function
*
* returns XML::GDOME node
*
* DESCRIPTION
* creates an Gdome node from our XML::LibXML node.
* this function is very useful for the parser.
*
* the function will only work, if XML::LibXML is compiled with
* XML::GDOME support.
*
*/
SV *
PmmNodeToGdomeSv( xmlNodePtr node );
/**
* NAME PmmNodeTypeName
* TYPE function
*
* returns the perl class name for the given node
*
* SYNOPSIS
* CLASS = PmmNodeTypeName( node );
*/
const char*
PmmNodeTypeName( xmlNodePtr elem );
xmlChar*
PmmEncodeString( const char *encoding, const xmlChar *string, STRLEN len );
char*
PmmDecodeString( const char *encoding, const xmlChar *string, STRLEN* len);
/* string manipulation will go elsewhere! */
/*
* NAME c_string_to_sv
* TYPE function
* SYNOPSIS
* SV *my_sv = c_string_to_sv( "my string", encoding );
*
* this function converts a libxml2 string to a SV*. although the
* string is copied, the func does not free the c-string for you!
*
* encoding is either NULL or a encoding string such as provided by
* the documents encoding. if encoding is NULL UTF8 is assumed.
*
*/
SV*
C2Sv( const xmlChar *string, const xmlChar *encoding );
/*
* NAME sv_to_c_string
* TYPE function
* SYNOPSIS
* SV *my_sv = sv_to_c_string( my_sv, encoding );
*
* this function converts a SV* to a libxml string. the SV-value will
* be copied into a *newly* allocated string. (don't forget to free it!)
*
* encoding is either NULL or a encoding string such as provided by
* the documents encoding. if encoding is NULL UTF8 is assumed.
*
*/
xmlChar *
Sv2C( SV* scalar, const xmlChar *encoding );
SV*
nodeC2Sv( const xmlChar * string, xmlNodePtr refnode );
xmlChar *
nodeSv2C( SV * scalar, xmlNodePtr refnode );
#endif