summaryrefslogtreecommitdiff
blob: aef4d87fd6ce96ac74020642dd1e0d9e90f7a70e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
#ifndef ARTIFEX_EXTRACT_AUTOSTRING_XML
#define ARTIFEX_EXTRACT_AUTOSTRING_XML

/* Only for internal use by extract code.  */

/* A simple string struct that reallocs as required. */
typedef struct
{
    char*   chars;      /* NULL or zero-terminated. */
    size_t  chars_num;  /* Length of string pointed to by .chars. */
} extract_astring_t;

void extract_astring_init(extract_astring_t* string);
/* Initialises <string> so it is ready for use. */

void extract_astring_free(extract_alloc_t* alloc, extract_astring_t* string);
/* Frees any existing data and returns with <string> ready for use as if by
extract_astring_init(). */

int extract_astring_catl(extract_alloc_t* alloc, extract_astring_t* string, const char* s, size_t s_len);

int extract_astring_catc(extract_alloc_t* alloc, extract_astring_t* string, char c);

int extract_astring_cat(extract_alloc_t* alloc, extract_astring_t* string, const char* s);
int extract_astring_catf(extract_alloc_t* alloc, extract_astring_t* string, const char* format, ...);

int extract_astring_truncate(extract_astring_t* content, int len);
/* Removes last <len> chars. */

int extract_astring_char_truncate_if(extract_astring_t* content, char c);
/* Removes last char if it is <c>. */

int extract_astring_cat_xmlc(extract_alloc_t* alloc, extract_astring_t* string, int c);
/* Appends specified character using XML escapes as necessary. */

int extract_astring_catc_unicode(
        extract_alloc_t* alloc,
        extract_astring_t* string,
        int c,
        int xml,
        int ascii_ligatures,
        int ascii_dash,
        int ascii_apostrophe
        );
/* Appends unicode character <c> to <string>.
    xml:
        If true, we use XML escape sequences for special characters such as '<'
        and unicode values above 127. Otherwise we encode as utf8.
    ascii_ligatures: if true we expand ligatures to "fl", "fi" etc.
    ascii_dash:
        If true we replace unicode dash characters with '-'.
    ascii_apostrophe:
        If true we replace unicode apostrophe with ascii single-quote "'".
*/

int extract_astring_catc_unicode_xml(extract_alloc_t* alloc, extract_astring_t* string, int c);
/* Appends specific unicode character, using XML escape sequences as required. */

#endif