annotate src/misc.c @ 1221:f34b803b8639

Handle signed chars. Aadded dIsspace() and dIsalnum() to dlib
author Jorge Arellano Cid <jcid@dillo.org>
date Sun, 12 Jul 2009 16:53:16 -0400
parents 94bca98ac942
children 83a462cf5d02
rev   line source
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
1 /*
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
2 * File: misc.c
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
3 *
35
d9e7b35430de Updated copyright lines
jcid
parents: 0
diff changeset
4 * Copyright (C) 2000 Jörgen Viksell <vsksga@hotmail.com>
d9e7b35430de Updated copyright lines
jcid
parents: 0
diff changeset
5 * Copyright (C) 2000-2007 Jorge Arellano Cid <jcid@dillo.org>,
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
6 *
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
7 * This program is free software; you can redistribute it and/or modify
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
8 * it under the terms of the GNU General Public License as published by
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
9 * the Free Software Foundation; either version 3 of the License, or
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
10 * (at your option) any later version.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
11 */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
12
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
13 #include <stdio.h>
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
14 #include <stdlib.h>
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
15 #include <string.h>
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
16 #include <ctype.h>
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
17
1128
fbe2ce98a4b8 make tab expansion for plain text utf8 aware
Johannes Hofmann <Johannes.Hofmann@gmx.de>
parents: 930
diff changeset
18 #include "utf8.hh"
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
19 #include "msg.h"
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
20 #include "misc.h"
1145
9b57a492918b Improved recognition heuristics for plain text in utf8
corvid <corvid@lavabit.com>
parents: 1141
diff changeset
21 #include "utf8.hh"
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
22
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
23 /*
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
24 * Escape characters as %XX sequences.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
25 * Return value: New string.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
26 */
306
7a76f872ce73 - Eliminated gcc 4.2.3 warnings on 64bit OS.
jcid
parents: 274
diff changeset
27 char *a_Misc_escape_chars(const char *str, const char *esc_set)
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
28 {
1141
corvid <corvid@lavabit.com>
parents: 1128
diff changeset
29 static const char *const hex = "0123456789ABCDEF";
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
30 char *p = NULL;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
31 Dstr *dstr;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
32 int i;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
33
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
34 dstr = dStr_sized_new(64);
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
35 for (i = 0; str[i]; ++i) {
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
36 if (str[i] <= 0x1F || str[i] == 0x7F || strchr(esc_set, str[i])) {
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
37 dStr_append_c(dstr, '%');
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
38 dStr_append_c(dstr, hex[(str[i] >> 4) & 15]);
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
39 dStr_append_c(dstr, hex[str[i] & 15]);
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
40 } else {
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
41 dStr_append_c(dstr, str[i]);
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
42 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
43 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
44 p = dstr->str;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
45 dStr_free(dstr, FALSE);
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
46
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
47 return p;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
48 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
49
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
50 #define TAB_SIZE 8
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
51 /*
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
52 * Takes a string and converts any tabs to spaces.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
53 */
340
da33058e94be - Fixed a memory leak in plain.cc.
jcid
parents: 306
diff changeset
54 char *a_Misc_expand_tabs(const char *str, int len)
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
55 {
1128
fbe2ce98a4b8 make tab expansion for plain text utf8 aware
Johannes Hofmann <Johannes.Hofmann@gmx.de>
parents: 930
diff changeset
56 int i = 0, j, pos = 0, old_pos, char_len;
fbe2ce98a4b8 make tab expansion for plain text utf8 aware
Johannes Hofmann <Johannes.Hofmann@gmx.de>
parents: 930
diff changeset
57 uint_t code;
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
58 char *val;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
59
1160
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
60 if (memchr(str, '\t', len) == NULL) {
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
61 val = dStrndup(str, len);
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
62 } else {
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
63 Dstr *New = dStr_new("");
1128
fbe2ce98a4b8 make tab expansion for plain text utf8 aware
Johannes Hofmann <Johannes.Hofmann@gmx.de>
parents: 930
diff changeset
64
1160
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
65 while (i < len) {
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
66 code = a_Utf8_decode(&str[i], str + len, &char_len);
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
67
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
68 if (code == '\t') {
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
69 /* Fill with whitespaces until the next tab. */
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
70 old_pos = pos;
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
71 pos += TAB_SIZE - (pos % TAB_SIZE);
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
72 for (j = old_pos; j < pos; j++)
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
73 dStr_append_c(New, ' ');
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
74 } else {
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
75 dStr_append_l(New, &str[i], char_len);
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
76 pos++;
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
77 }
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
78
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
79 i += char_len;
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
80 }
1128
fbe2ce98a4b8 make tab expansion for plain text utf8 aware
Johannes Hofmann <Johannes.Hofmann@gmx.de>
parents: 930
diff changeset
81
1160
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
82 val = New->str;
ea163ab97e87 faster expand tabs
corvid <corvid@lavabit.com>
parents: 1145
diff changeset
83 dStr_free(New, FALSE);
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
84 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
85 return val;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
86 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
87
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
/* TODO: could use dStr ADT! */
/* A MIME type name paired with its length in bytes (NUL not counted). */
typedef struct ContentType_ {
   const char *str;
   int len;
} ContentType_t;

/* Build a table entry from a string literal, taking the length from it. */
#define MIME_ENTRY(lit) { lit, (int) (sizeof(lit) - 1) }

/*
 * MIME types this file can report. Entries are indexed by
 * DetectedContentType, so both lists must keep the same order.
 * The table ends with a { NULL, 0 } sentinel.
 */
static const ContentType_t MimeTypes[] = {
   MIME_ENTRY("application/octet-stream"),
   MIME_ENTRY("text/html"),
   MIME_ENTRY("text/plain"),
   MIME_ENTRY("image/gif"),
   MIME_ENTRY("image/png"),
   MIME_ENTRY("image/jpeg"),
   { NULL, 0 }
};

#undef MIME_ENTRY

/* Index into MimeTypes[] for each detectable content type. */
typedef enum {
   DT_OCTET_STREAM = 0,
   DT_TEXT_HTML    = 1,
   DT_TEXT_PLAIN   = 2,
   DT_IMAGE_GIF    = 3,
   DT_IMAGE_PNG    = 4,
   DT_IMAGE_JPG    = 5
} DetectedContentType;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
112
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
113 /*
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
114 * Detects 'Content-Type' from a data stream sample.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
115 *
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
116 * It uses the magic(5) logic from file(1). Currently, it
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
117 * only checks the few mime types that Dillo supports.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
118 *
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
119 * 'Data' is a pointer to the first bytes of the raw data.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
120 *
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
121 * Return value: (0 on success, 1 on doubt, 2 on lack of data).
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
122 */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
123 int a_Misc_get_content_type_from_data(void *Data, size_t Size, const char **PT)
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
124 {
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
125 size_t i, non_ascci, non_ascci_text, bin_chars;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
126 char *p = Data;
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
127 int st = 1; /* default to "doubt' */
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
128 DetectedContentType Type = DT_OCTET_STREAM; /* default to binary */
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
129
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
130 /* HTML try */
1221
f34b803b8639 Handle signed chars. Aadded dIsspace() and dIsalnum() to dlib
Jorge Arellano Cid <jcid@dillo.org>
parents: 1186
diff changeset
131 for (i = 0; i < Size && dIsspace(p[i]); ++i);
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
132 if ((Size - i >= 5 && !dStrncasecmp(p+i, "<html", 5)) ||
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
133 (Size - i >= 5 && !dStrncasecmp(p+i, "<head", 5)) ||
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
134 (Size - i >= 6 && !dStrncasecmp(p+i, "<title", 6)) ||
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
135 (Size - i >= 14 && !dStrncasecmp(p+i, "<!doctype html", 14)) ||
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
136 /* this line is workaround for FTP through the Squid proxy */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
137 (Size - i >= 17 && !dStrncasecmp(p+i, "<!-- HTML listing", 17))) {
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
138
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
139 Type = DT_TEXT_HTML;
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
140 st = 0;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
141 /* Images */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
142 } else if (Size >= 4 && !dStrncasecmp(p, "GIF8", 4)) {
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
143 Type = DT_IMAGE_GIF;
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
144 st = 0;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
145 } else if (Size >= 4 && !dStrncasecmp(p, "\x89PNG", 4)) {
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
146 Type = DT_IMAGE_PNG;
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
147 st = 0;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
148 } else if (Size >= 2 && !dStrncasecmp(p, "\xff\xd8", 2)) {
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
149 /* JPEG has the first 2 bytes set to 0xffd8 in BigEndian - looking
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
150 * at the character representation should be machine independent. */
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
151 Type = DT_IMAGE_JPG;
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
152 st = 0;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
153
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
154 /* Text */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
155 } else {
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
156 /* Heuristic for "text/plain"
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
157 * {ASCII, LATIN1, UTF8, KOI8-R, CP-1251}
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
158 * All in the above set regard [00-31] as control characters.
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
159 * LATIN1: [7F-9F] unused
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
160 * CP-1251 {7F,98} unused (two characters).
930
b277eed3119c whitespace cleanup: 's/ +$//g'
Jorge Arellano Cid <jcid@dillo.org>
parents: 368
diff changeset
161 *
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
162 * We'll use [0-31] as indicators of non-text content.
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
163 * Better heuristics are welcomed! :-) */
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
164
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
165 non_ascci = non_ascci_text = bin_chars = 0;
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
166 Size = MIN (Size, 256);
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
167 for (i = 0; i < Size; i++) {
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
168 int ch = (uchar_t) p[i];
1221
f34b803b8639 Handle signed chars. Aadded dIsspace() and dIsalnum() to dlib
Jorge Arellano Cid <jcid@dillo.org>
parents: 1186
diff changeset
169 if (ch < 32 && !dIsspace(ch))
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
170 ++bin_chars;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
171 if (ch > 126)
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
172 ++non_ascci;
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
173 if (ch > 190)
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
174 ++non_ascci_text;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
175 }
1145
9b57a492918b Improved recognition heuristics for plain text in utf8
corvid <corvid@lavabit.com>
parents: 1141
diff changeset
176 if (bin_chars == 0 && (non_ascci - non_ascci_text) <= Size/10) {
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
177 /* Let's say text: if "rare" chars are <= 10% */
1145
9b57a492918b Improved recognition heuristics for plain text in utf8
corvid <corvid@lavabit.com>
parents: 1141
diff changeset
178 Type = DT_TEXT_PLAIN;
9b57a492918b Improved recognition heuristics for plain text in utf8
corvid <corvid@lavabit.com>
parents: 1141
diff changeset
179 } else if (Size > 0) {
9b57a492918b Improved recognition heuristics for plain text in utf8
corvid <corvid@lavabit.com>
parents: 1141
diff changeset
180 /* a special check for UTF-8 */
9b57a492918b Improved recognition heuristics for plain text in utf8
corvid <corvid@lavabit.com>
parents: 1141
diff changeset
181 Size = a_Utf8_end_of_char(p, Size - 1) + 1;
9b57a492918b Improved recognition heuristics for plain text in utf8
corvid <corvid@lavabit.com>
parents: 1141
diff changeset
182 if (a_Utf8_test(p, Size) > 0)
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
183 Type = DT_TEXT_PLAIN;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
184 }
1145
9b57a492918b Improved recognition heuristics for plain text in utf8
corvid <corvid@lavabit.com>
parents: 1141
diff changeset
185 if (Size >= 256)
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
186 st = 0;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
187 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
188
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
189 *PT = MimeTypes[Type].str;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
190 return st;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
191 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
192
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
193 /*
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
194 * Parse Content-Type string, e.g., "text/html; charset=utf-8".
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
195 */
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
196 void a_Misc_parse_content_type(const char *str, char **major, char **minor,
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
197 char **charset)
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
198 {
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
199 const char *s;
1166
6d2de3dccef1 only parse charset parameter for text/* media types
corvid <corvid@lavabit.com>
parents: 1160
diff changeset
200 bool_t is_text;
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
201
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
202 if (major)
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
203 *major = NULL;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
204 if (minor)
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
205 *minor = NULL;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
206 if (charset)
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
207 *charset = NULL;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
208 if (!str)
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
209 return;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
210
1221
f34b803b8639 Handle signed chars. Aadded dIsspace() and dIsalnum() to dlib
Jorge Arellano Cid <jcid@dillo.org>
parents: 1186
diff changeset
211 for (s = str; dIsalnum(*s) || (*s == '-'); s++);
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
212 if (major)
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
213 *major = dStrndup(str, s - str);
1166
6d2de3dccef1 only parse charset parameter for text/* media types
corvid <corvid@lavabit.com>
parents: 1160
diff changeset
214 is_text = (s - str == 4) && !dStrncasecmp(str, "text", 4);
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
215
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
216 if (*s == '/') {
1221
f34b803b8639 Handle signed chars. Aadded dIsspace() and dIsalnum() to dlib
Jorge Arellano Cid <jcid@dillo.org>
parents: 1186
diff changeset
217 for (str = ++s; dIsalnum(*s) || (*s == '-'); s++);
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
218 if (minor)
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
219 *minor = dStrndup(str, s - str);
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
220 }
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
221
1166
6d2de3dccef1 only parse charset parameter for text/* media types
corvid <corvid@lavabit.com>
parents: 1160
diff changeset
222 if (is_text && charset && *s) {
6d2de3dccef1 only parse charset parameter for text/* media types
corvid <corvid@lavabit.com>
parents: 1160
diff changeset
223 /* charset parameter is defined for text media type (RFC 2046) */
250
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
224 const char terminators[] = " ;\t";
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
225 const char key[] = "charset";
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
226
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
227 if ((s = dStristr(str, key)) &&
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
228 (s == str || strchr(terminators, s[-1]))) {
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
229 s += sizeof(key) - 1;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
230 for ( ; *s == ' ' || *s == '\t'; ++s);
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
231 if (*s == '=') {
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
232 size_t len;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
233 for (++s; *s == ' ' || *s == '\t'; ++s);
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
234 if ((len = strcspn(s, terminators))) {
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
235 if (*s == '"' && s[len-1] == '"' && len > 1) {
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
236 /* quoted string */
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
237 s++;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
238 len -= 2;
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
239 }
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
240 *charset = dStrndup(s, len);
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
241 }
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
242 }
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
243 }
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
244 }
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
245 }
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
246
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
/*
 * Compare two Content-Type strings.
 * Return 0 if they are equivalent, and 1 otherwise.
 *
 * Two NULL/empty strings are equivalent; one NULL/empty against a
 * non-empty one is not. Otherwise major and minor types must both be
 * present and match case-insensitively, and the charsets must either
 * match, both be absent, or the only one present must be "UTF-8".
 */
int a_Misc_content_type_cmp(const char *ct1, const char *ct2)
{
   char *maj_a, *min_a, *cs_a;
   char *maj_b, *min_b, *cs_b;
   const int empty_a = (!ct1 || !*ct1);
   const int empty_b = (!ct2 || !*ct2);
   int differ = 1;

   if (empty_a || empty_b)
      return (empty_a && empty_b) ? 0 : 1;

   a_Misc_parse_content_type(ct1, &maj_a, &min_a, &cs_a);
   a_Misc_parse_content_type(ct2, &maj_b, &min_b, &cs_b);

   if (maj_a && maj_b && min_a && min_b &&
       !dStrcasecmp(maj_a, maj_b) && !dStrcasecmp(min_a, min_b)) {
      if (cs_a && cs_b) {
         differ = (dStrcasecmp(cs_a, cs_b) != 0);
      } else if (cs_a || cs_b) {
         /* A missing charset is treated as UTF-8. */
         differ = (dStrcasecmp(cs_a ? cs_a : cs_b, "UTF-8") != 0);
      } else {
         differ = 0;
      }
   }

   dFree(maj_a);
   dFree(min_a);
   dFree(cs_a);
   dFree(maj_b);
   dFree(min_b);
   dFree(cs_b);

   return differ;
}
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
280
fce9380ee68a - Switched from charset to content-type for handling data.
jcid
parents: 180
diff changeset
281 /*
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
282 * Check the server-supplied 'Content-Type' against our detected type.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
283 * (some servers seem to default to "text/plain").
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
284 *
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
285 * Return value:
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
286 * 0, if they match
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
287 * -1, if a mismatch is detected
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
288 *
155
fb8da086d7da + s/there're/there are/g
jcid
parents: 35
diff changeset
289 * There are many MIME types Dillo doesn't know, they're handled
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
290 * as "application/octet-stream" (as the SPEC says).
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
291 *
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
292 * A mismatch happens when receiving a binary stream as
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
293 * "text/plain" or "text/html", or an image that's not an image of its kind.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
294 *
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
295 * Note: this is a basic security procedure.
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
296 *
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
297 */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
298 int a_Misc_content_type_check(const char *EntryType, const char *DetectedType)
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
299 {
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
300 int i;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
301 int st = -1;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
302
274
1deca4cad4c4 - Implemented OBJECT as link (similar to FRAME).
jcid
parents: 250
diff changeset
303 _MSG("Type check: [Srv: %s Det: %s]\n", EntryType, DetectedType);
0
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
304
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
305 if (!EntryType)
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
306 return 0; /* there's no mismatch without server type */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
307
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
308 for (i = 1; MimeTypes[i].str; ++i)
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
309 if (dStrncasecmp(EntryType, MimeTypes[i].str, MimeTypes[i].len) == 0)
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
310 break;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
311
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
312 if (!MimeTypes[i].str) {
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
313 /* type not found, no mismatch */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
314 st = 0;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
315 } else if (dStrncasecmp(EntryType, "image/", 6) == 0 &&
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
316 !dStrncasecmp(DetectedType,MimeTypes[i].str,MimeTypes[i].len)){
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
317 /* An image, and there's an exact match */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
318 st = 0;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
319 } else if (dStrncasecmp(EntryType, "text/", 5) ||
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
320 dStrncasecmp(DetectedType, "application/", 12)) {
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
321 /* Not an application sent as text */
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
322 st = 0;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
323 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
324
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
325 return st;
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
326 }
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
327
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
/*
 * Parse a geometry string of the form "<w>x<h>" optionally followed by
 * two more integers for the position (e.g. "640x480+10+20").
 *
 * The separator is the first 'x' in the string or, if there's none,
 * the first 'X'. Width is read from the start of the string and height
 * from just after the separator, both with strtol() in base 10.
 *
 * *w and *h are stored only when both numbers were parsed.
 * *x and *y are stored only when, in addition, two more numbers follow
 * the height. Outputs that aren't stored are left untouched.
 *
 * Return value: 1 if width and height were parsed, 0 otherwise.
 */
int a_Misc_parse_geometry(char *str, int *x, int *y, int *w, int *h)
{
   char *sep, *end_a, *end_b;
   int parsed = 0;

   /* Lowercase separator takes precedence over uppercase */
   sep = strchr(str, 'x');
   if (sep == NULL)
      sep = strchr(str, 'X');

   if (sep != NULL) {
      char *height_start = sep + 1;
      int width = strtol(str, &end_a, 10);
      int height = strtol(height_start, &end_b, 10);

      /* strtol() leaves the end pointer at the start when no digits
       * were consumed */
      if (end_a != str && end_b != height_start) {
         char *offs_start = end_b;
         int off_x, off_y;

         *w = width;
         *h = height;
         parsed = 1;

         /* the position, if any, comes right after the height */
         off_x = strtol(offs_start, &end_a, 10);
         off_y = strtol(end_a, &end_b, 10);
         if (end_a != offs_start && end_b != end_a) {
            *x = off_x;
            *y = off_y;
         }
      }
   }
   _MSG("geom: w,h,x,y = (%d,%d,%d,%d)\n", *w, *h, *x, *y);
   return parsed;
}
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
357
6ee11bf9e3ea Initial revision
jcid
parents:
diff changeset
/*
 * Encodes a NUL-terminated string using base64 encoding
 * (alphabet "A-Za-z0-9+/", padded with '=').
 *
 * in - string to encode (may be NULL).
 *
 * Return value: a new NUL-terminated string obtained from dMalloc(),
 * or NULL if 'in' is NULL. An empty input yields an empty string,
 * not NULL.
 */
char *a_Misc_encode_base64(const char *in)
{
   static const char *const base64_hex = "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
                                         "abcdefghijklmnopqrstuvwxyz"
                                         "0123456789+/";
   /* Read the input as unsigned bytes: with a signed 'char', bytes
    * >= 0x80 would be negative, giving negative table indexes and
    * left shifts of negative values. */
   const unsigned char *src = (const unsigned char *)in;
   char *out = NULL;
   size_t len, i = 0;

   if (in == NULL)
      return NULL;
   len = strlen(in);

   /* 4 output chars for every (possibly partial) group of 3 input
    * bytes, plus the terminating NUL */
   out = (char *)dMalloc((len + 2) / 3 * 4 + 1);

   /* full 3-byte groups */
   for (; len >= 3; len -= 3) {
      out[i++] = base64_hex[src[0] >> 2];
      out[i++] = base64_hex[((src[0] << 4) & 0x30) | (src[1] >> 4)];
      out[i++] = base64_hex[((src[1] << 2) & 0x3c) | (src[2] >> 6)];
      out[i++] = base64_hex[src[2] & 0x3f];
      src += 3;
   }

   /* trailing group of 1 or 2 bytes, padded with '=' */
   if (len > 0) {
      unsigned int fragment;

      out[i++] = base64_hex[src[0] >> 2];
      fragment = (src[0] << 4) & 0x30;
      if (len > 1)
         fragment |= src[1] >> 4;
      out[i++] = base64_hex[fragment];
      out[i++] = (len < 2) ? '=' : base64_hex[(src[1] << 2) & 0x3c];
      out[i++] = '=';
   }
   out[i] = '\0';
   return out;
}
180
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
395
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
396 /*
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
397 * Load a local file into a dStr.
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
398 * Return value: dStr on success, NULL on error.
368
2242da885677 - s/todo:/TODO:/g
jcid
parents: 340
diff changeset
399 * TODO: a filesize threshold may be implemented.
180
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
400 */
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
401 Dstr *a_Misc_file2dstr(const char *filename)
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
402 {
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
403 FILE *F_in;
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
404 int n;
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
405 char buf[4096];
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
406 Dstr *dstr = NULL;
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
407
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
408 if ((F_in = fopen(filename, "r"))) {
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
409 dstr = dStr_sized_new(4096);
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
410 while ((n = fread (buf, 1, 4096, F_in)) > 0) {
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
411 dStr_append_l(dstr, buf, n);
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
412 }
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
413 fclose(F_in);
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
414 }
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
415 return dstr;
0038a2943cc2 - Made file inputs free the loaded file after the page is left.
jcid
parents: 155
diff changeset
416 }