1 |
/* |
2 |
* gen_html4.c - Part of psiconv, a PSION 5 data formats converter |
3 |
* Copyright (c) 1999 Andrew Johnson <anjohnson@iee.org> |
4 |
* Portions Copyright (c) 1999 Frodo Looijaard <frodol@dds.nl> |
5 |
* |
6 |
* This program is free software; you can redistribute it and/or modify |
7 |
* it under the terms of the GNU General Public License as published by |
8 |
* the Free Software Foundation; either version 2 of the License, or |
9 |
* (at your option) any later version. |
10 |
* |
11 |
* This program is distributed in the hope that it will be useful, |
12 |
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
13 |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
14 |
* GNU General Public License for more details. |
15 |
* |
16 |
* You should have received a copy of the GNU General Public License |
17 |
* along with this program; if not, write to the Free Software |
18 |
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. |
19 |
*/ |
20 |
|
21 |
#include "config.h" |
22 |
#include <stdio.h> |
23 |
#include <string.h> |
24 |
#include <ctype.h> |
25 |
#include <stdlib.h> |
26 |
#include "psiconv/data.h" |
27 |
#include "psiconv/list.h" |
28 |
#include "gen.h" |
29 |
#include "psiconv.h" |
30 |
|
31 |
#ifndef TRUE |
32 |
#define TRUE (0==0) |
33 |
#endif |
34 |
|
35 |
#ifdef DMALLOC |
36 |
#include "dmalloc.h" |
37 |
#endif |
38 |
|
39 |
/* |
40 |
* Various string tables for HTML4 settings |
41 |
*/ |
42 |
|
43 |
/* How to display each character */ |
44 |
static const char *char_table[0x100] = { |
45 |
/* 0x00 */ "", "", "", "", "", "", "<BR>\n", "<BR>\n", |
46 |
/* 0x08 */ "\n<HR>\n", "\t", "", "", "", "", "", "", |
47 |
/* 0x10 */ " ", "", "", "", "", "", "", "", |
48 |
/* 0x18 */ "", "", "", "", "", "", "", "", |
49 |
/* 0x20 */ " ", "!", """, "#", "$", "%", "&", "'", |
50 |
/* 0x28 */ "(", ")", "*", "+", ",", "-", ".", "/", |
51 |
/* 0x30 */ "0", "1", "2", "3", "4", "5", "6", "7", |
52 |
/* 0x38 */ "8", "9", ":", ";", "<", "=", ">", "?", |
53 |
/* 0x40 */ "@", "A", "B", "C", "D", "E", "F", "G", |
54 |
/* 0x48 */ "H", "I", "J", "K", "L", "M", "N", "O", |
55 |
/* 0x50 */ "P", "Q", "R", "S", "T", "U", "V", "W", |
56 |
/* 0x58 */ "X", "Y", "Z", "[", "\\", "]", "^", "_", |
57 |
/* 0x60 */ "`", "a", "b", "c", "d", "e", "f", "g", |
58 |
/* 0x68 */ "h", "i", "j", "k", "l", "m", "n", "o", |
59 |
/* 0x70 */ "p", "q", "r", "s", "t", "u", "v", "w", |
60 |
/* 0x78 */ "x", "y", "z", "{", "|", "}", "~", "", |
61 |
/* 0x80 */ "", "", "‚", "ƒ", |
62 |
"„", "…", "†", "‡", |
63 |
/* 0x88 */ "ˆ", "‰", "Š", "<", |
64 |
"Œ", "", "", "", |
65 |
/* 0x90 */ "", "‘", "’", "“", |
66 |
"”","•", "–", "—", |
67 |
/* 0x98 */ "˜", "™", "š", ">", |
68 |
"œ", "", "", "Ÿ", |
69 |
/* 0xa0 */ " ", "¡", "¢", "£", |
70 |
"¤", "¥", "¦", "§", |
71 |
/* 0xa8 */ "¨", "©", "ª", "«", |
72 |
"¬", "­", "®", "¯", |
73 |
/* 0xb0 */ "°", "±", "²", "³", |
74 |
"´", "µ", "¶", "·", |
75 |
/* 0xb8 */ "¸", "¹", "º", "»", |
76 |
"¼", "½", "¾", "¿", |
77 |
/* 0xc0 */ "À", "Á", "Â", "Ã", |
78 |
"Ä", "Å", "Æ", "Ç", |
79 |
/* 0xc8 */ "È", "É", "Ê", "Ë", |
80 |
"Ì", "Í", "Î", "Ï", |
81 |
/* 0xd0 */ "Ð", "Ñ", "Ò", "Ó", |
82 |
"Ô", "Õ", "Ö", "×", |
83 |
/* 0xd8 */ "Ø", "Ù", "Ú", "Û", |
84 |
"Ü", "Ý", "Þ", "ß", |
85 |
/* 0xe0 */ "à", "á", "â", "ã", |
86 |
"ä", "å", "æ", "ç", |
87 |
/* 0xe8 */ "è", "é", "ê", "ë", |
88 |
"ì", "í", "î", "ï", |
89 |
/* 0xf0 */ "ð", "ñ", "ò", "ó", |
90 |
"ô", "õ", "ö", "÷", |
91 |
/* 0xf8 */ "ø", "ù", "ú", "û", |
92 |
"ü", "ý", "þ", "ÿ" |
93 |
}; |
94 |
|
95 |
/* The order of these must match the enum psiconv_border_kind (data.h) */ |
96 |
static const char *border_strings[] = { |
97 |
"none", "solid", "double", "dotted", "dashed", "dashed", "dotted" |
98 |
}; |
99 |
|
100 |
/* The order of these must match the enum psiconv_justify (data.h) */ |
101 |
static const char *justify_strings[] = { |
102 |
"left", "center", "right", "justify" |
103 |
}; |
104 |
|
105 |
/* The order of these must match the enum psiconv_super_sub (data.h) */ |
106 |
static const char *vertical_strings[] = { |
107 |
"baseline", "super", "sub" |
108 |
}; |
109 |
|
110 |
|
111 |
/* |
112 |
* Support routines for particular formatting structures |
113 |
*/ |
114 |
|
115 |
static void fput_name(FILE * of, const char *string) { |
116 |
int i; |
117 |
|
118 |
for (i = 0; i < strlen(string); i++) |
119 |
if (isalnum(string[i])) |
120 |
putc(string[i], of); |
121 |
} |
122 |
|
123 |
static void fput_text(FILE * of, const char *text, int length, int *pwasspace) { |
124 |
int j; |
125 |
int space; |
126 |
|
127 |
for (j = 0; j < length; j++) { |
128 |
space = (text[j] == ' '); |
129 |
if (*pwasspace && space) |
130 |
fputs(" ", of); |
131 |
else |
132 |
fputs(char_table[(unsigned char) (text[j])], of); |
133 |
*pwasspace = space; |
134 |
} |
135 |
} |
136 |
|
137 |
static const char *screenfont_name(psiconv_u8 screenfont) |
138 |
{ |
139 |
if (screenfont == psiconv_font_sansserif) |
140 |
return "sans-serif"; |
141 |
else if (screenfont == psiconv_font_nonprop) |
142 |
return "monospace"; |
143 |
else if (screenfont == psiconv_font_serif) |
144 |
return "serif"; |
145 |
else |
146 |
return "serif"; |
147 |
} |
148 |
|
149 |
static const char *generic_font_family(const char *font_name) { |
150 |
static const char *sans_font_names[] = { |
151 |
"Arial", "Univers", "Sans Serif" |
152 |
}; |
153 |
static const char *mono_font_names[] = { |
154 |
"Courier New", "Courier", "Mono", "Lineprinter", "Elite", "Swiss", |
155 |
"Courier (compressed)", "Courier (expanded)", "Letter Gothic" |
156 |
}; |
157 |
int i; |
158 |
|
159 |
for (i=0; i < sizeof(sans_font_names) / sizeof(sans_font_names[0]); i++) |
160 |
if (!strcmp(font_name, sans_font_names[i])) |
161 |
return "sans-serif"; |
162 |
|
163 |
for (i=0; i < sizeof(mono_font_names) / sizeof(mono_font_names[0]); i++) |
164 |
if (!strcmp(font_name, mono_font_names[i])) |
165 |
return "monospace"; |
166 |
|
167 |
return "serif"; |
168 |
} |
169 |
|
170 |
static int colors_different( |
171 |
const psiconv_color old, |
172 |
const psiconv_color new) |
173 |
{ |
174 |
return ((old->red != new->red) || |
175 |
(old->green != new->green) || |
176 |
(old->blue != new->blue)); |
177 |
} |
178 |
|
179 |
|
180 |
/* Borders */ |
181 |
static int borders_different( |
182 |
const psiconv_border old, |
183 |
const psiconv_border new) |
184 |
{ |
185 |
return (!old || |
186 |
(old->kind != new->kind) || |
187 |
colors_different(old->color, new->color) || |
188 |
(old->thickness != new->thickness)); |
189 |
} |
190 |
|
191 |
static void fput_border(FILE * of, |
192 |
const char *which, |
193 |
const psiconv_border old, |
194 |
const psiconv_border new) |
195 |
{ |
196 |
/* If the border changed at all we'll set all parameters, as they're |
197 |
* fairly closely linked and it's much easier to do it this way */ |
198 |
if (borders_different(old, new)) { |
199 |
fprintf(of, "border-%s-style:%s;", |
200 |
which, border_strings[new->kind]); |
201 |
if ((new->kind != psiconv_border_none) && |
202 |
(new->color->red || new->color->green || new->color->blue)) |
203 |
fprintf(of, "border-%s-color:#%02x%02x%02x;", which, |
204 |
new->color->red, new->color->green, new->color->blue); |
205 |
if ((new->kind == psiconv_border_solid) || |
206 |
(new->kind == psiconv_border_double)) |
207 |
fprintf(of, "border-%s-width:%.0fpx;", |
208 |
which, (new->thickness / 10.0) - 1); |
209 |
else if (new->kind != psiconv_border_none) |
210 |
fprintf(of, "border-%s-width:1px;", which); |
211 |
} |
212 |
} |
213 |
|
214 |
/* Paragraph formats */ |
215 |
static int paragraph_layouts_different( |
216 |
const psiconv_paragraph_layout old, |
217 |
const psiconv_paragraph_layout new) |
218 |
{ |
219 |
return ((old->space_above != new->space_above) || |
220 |
(old->indent_right != new->indent_right) || |
221 |
(old->space_below != new->space_below) || |
222 |
(old->indent_left != new->indent_left) || |
223 |
(old->indent_first != new->indent_first) || |
224 |
(old->justify_hor != new->justify_hor) || |
225 |
(old->linespacing_exact != new->linespacing_exact) || |
226 |
borders_different(old->left_border, new->left_border) || |
227 |
borders_different(old->right_border, new->right_border) || |
228 |
borders_different(old->top_border, new->top_border) || |
229 |
borders_different(old->bottom_border, new->bottom_border)); |
230 |
} |
231 |
|
232 |
static void fput_paragraph_layout(FILE * of, |
233 |
const psiconv_paragraph_layout old, |
234 |
const psiconv_paragraph_layout new) |
235 |
{ |
236 |
if (!old || (old->space_above != new->space_above)) |
237 |
fprintf(of, "margin-top:%.1fpt;", new->space_above); |
238 |
if (!old || (old->indent_right != new->indent_right)) |
239 |
fprintf(of, "margin-right:%.2fcm;", new->indent_right); |
240 |
if (!old || (old->space_below != new->space_below)) |
241 |
fprintf(of, "margin-bottom:%.1fpt;", new->space_below); |
242 |
if (!old || |
243 |
(old->bullet->on != new->bullet->on) || |
244 |
(old->bullet->indent != new->bullet->indent) || |
245 |
(old->indent_left != new->indent_left) || |
246 |
(old->indent_first != new->indent_first)) { |
247 |
psiconv_length_t indent = new->indent_first; |
248 |
psiconv_length_t margin = new->indent_left; |
249 |
/* Bullets with indent set cause strange margin behaviour: */ |
250 |
if (new->bullet->on && new->bullet->indent) { |
251 |
if (indent > 0.0) { |
252 |
margin += indent; |
253 |
indent = new->indent_left - indent; |
254 |
} |
255 |
} |
256 |
fprintf(of, "margin-left:%.2fcm;", margin); |
257 |
fprintf(of, "text-indent:%.2fcm;", indent); |
258 |
} |
259 |
if (!old || (old->justify_hor != new->justify_hor)) |
260 |
fprintf(of, "text-align:%s;", justify_strings[new->justify_hor]); |
261 |
if (!old || (old->linespacing_exact != new->linespacing_exact)) { |
262 |
if (!old || old->linespacing_exact) |
263 |
fputs("line-height:normal;", of); |
264 |
else |
265 |
fprintf(of, "line-height:%.1fpt;", new->linespacing); |
266 |
} |
267 |
fput_border(of, "left", old ? old->left_border : NULL, |
268 |
new->left_border); |
269 |
fput_border(of, "right", old ? old->right_border : NULL, |
270 |
new->right_border); |
271 |
fput_border(of, "top", old ? old->top_border : NULL, |
272 |
new->top_border); |
273 |
fput_border(of, "bottom", old ? old->bottom_border : NULL, |
274 |
new->bottom_border); |
275 |
} |
276 |
|
277 |
/* Character formats */ |
278 |
static int character_layouts_different( |
279 |
const psiconv_character_layout old, |
280 |
const psiconv_character_layout new) |
281 |
{ |
282 |
return ((old->font->screenfont != new->font->screenfont) || |
283 |
(strcmp(old->font->name,new->font->name)) || |
284 |
(old->font_size != new->font_size) || |
285 |
(old->color->red != new->color->red) || |
286 |
(old->color->green != new->color->green) || |
287 |
(old->color->blue != new->color->blue) || |
288 |
(old->back_color->red != new->back_color->red) || |
289 |
(old->back_color->green != new->back_color->green) || |
290 |
(old->back_color->blue != new->back_color->blue) || |
291 |
(old->italic != new->italic) || |
292 |
(old->bold != new->bold) || |
293 |
(old->super_sub != new->super_sub) || |
294 |
(old->underline != new->underline) || |
295 |
(old->strikethrough != new->strikethrough)); |
296 |
} |
297 |
|
298 |
static void fput_character_layout(FILE * of, |
299 |
const psiconv_character_layout old, |
300 |
const psiconv_character_layout new, |
301 |
psiconv_word_f wf) |
302 |
{ |
303 |
if (!old || (old->font->screenfont != new->font->screenfont) || |
304 |
strcmp(old->font->name,new->font->name)) { |
305 |
fprintf(of, "font-family:%s,%s,%s;", new->font->name, |
306 |
generic_font_family(new->font->name), |
307 |
screenfont_name(new->font->screenfont)); |
308 |
} |
309 |
if (!old || (old->font_size != new->font_size)) |
310 |
fprintf(of, "font-size:%.1f%%;", 100.0 * new->font_size / 10.0); |
311 |
if (!old || (old->bold != new->bold)) |
312 |
fprintf(of, "font-weight:%s;", new->bold ? "bold" : "normal"); |
313 |
if (!old || (old->italic != new->italic)) |
314 |
fprintf(of, "font-style:%s;", new->italic ? "italic" : "normal"); |
315 |
if (!old || (colors_different(old->color, new->color))) |
316 |
fprintf(of, "color:#%02x%02x%02x;", |
317 |
new->color->red, new->color->green, new->color->blue); |
318 |
if (!old || (colors_different(old->back_color, new->back_color))) |
319 |
fprintf(of, "background-color:#%02x%02x%02x;", |
320 |
new->back_color->red, new->back_color->green, new->back_color->blue); |
321 |
if (!old || (old->super_sub != new->super_sub)) |
322 |
fprintf(of, "vertical-align:%s;", vertical_strings[new->super_sub]); |
323 |
if (!old || (old->underline != new->underline) || |
324 |
(old->strikethrough != new->strikethrough)) { |
325 |
fputs("text-decoration:", of); |
326 |
if (new->strikethrough) |
327 |
fputs("line-through ", of); |
328 |
if (new->underline) |
329 |
fputs("underline", of); |
330 |
else if (!new->strikethrough) |
331 |
fputs("none", of); |
332 |
fputs(";", of); |
333 |
} |
334 |
} |
335 |
|
336 |
|
337 |
/* Formatted paragraphs */ |
338 |
static void fput_para(FILE * of, |
339 |
const psiconv_paragraph para, |
340 |
psiconv_word_f wf) |
341 |
{ |
342 |
psiconv_paragraph_layout base_para = para->base_paragraph; |
343 |
psiconv_character_layout base_char = para->base_character; |
344 |
psiconv_character_layout cur_char; |
345 |
psiconv_character_layout *layout_stack; |
346 |
psiconv_in_line_layout inl; |
347 |
psiconv_word_style sty; |
348 |
int spans = 0; |
349 |
int wasspace = 0; |
350 |
int i, j, loc; |
351 |
|
352 |
layout_stack = calloc(psiconv_list_length(para->in_lines), |
353 |
sizeof(*layout_stack)); |
354 |
fputs("<P", of); |
355 |
sty = psiconv_get_style(wf->styles_sec, para->base_style); |
356 |
cur_char = sty->character; |
357 |
|
358 |
if (sty->name) { |
359 |
fputs(" CLASS=\"", of); |
360 |
fput_name(of, sty->name); |
361 |
putc('"', of); |
362 |
} |
363 |
|
364 |
if (paragraph_layouts_different(sty->paragraph, base_para) || |
365 |
character_layouts_different(cur_char, base_char)) { |
366 |
fputs(" STYLE=\"", of); |
367 |
fput_paragraph_layout(of, sty->paragraph, base_para); |
368 |
fput_character_layout(of, cur_char, base_char, wf); |
369 |
cur_char = base_char; |
370 |
putc('"', of); |
371 |
} |
372 |
putc('>', of); |
373 |
|
374 |
if (base_para->bullet->on) { |
375 |
fputs("<SPAN STYLE=\"", of); |
376 |
if (base_para->bullet->font != base_char->font) { |
377 |
fprintf(of, "font-family:%s,%s,%s;", |
378 |
base_para->bullet->font->name, |
379 |
generic_font_family(base_para->bullet->font->name), |
380 |
screenfont_name(base_para->bullet->font->screenfont)); |
381 |
} |
382 |
if (base_para->bullet->font_size != base_char->font_size) |
383 |
fprintf(of, "font-size:%.1f%%;", |
384 |
100.0 * base_para->bullet->font_size / 10.0); |
385 |
if ((base_para->bullet->color->red != base_char->color->red) || |
386 |
(base_para->bullet->color->green != base_char->color->green) || |
387 |
(base_para->bullet->color->blue != base_char->color->blue)) |
388 |
fprintf(of, "color:#%02x%02x%02x;", |
389 |
base_para->bullet->color->red, |
390 |
base_para->bullet->color->green, |
391 |
base_para->bullet->color->blue); |
392 |
fprintf(of, "\">%s </SPAN>", |
393 |
char_table[base_para->bullet->character]); |
394 |
wasspace = TRUE; |
395 |
} |
396 |
|
397 |
loc = 0; |
398 |
for (i = 0; i < psiconv_list_length(para->in_lines); i++) { |
399 |
inl = psiconv_list_get(para->in_lines, i); |
400 |
if (character_layouts_different(cur_char, inl->layout)) { |
401 |
for (j = 0; j < spans; j++) |
402 |
if (!character_layouts_different(inl->layout, layout_stack[j])) |
403 |
break; |
404 |
if (j < spans) { |
405 |
while (spans > j) { |
406 |
fputs("</SPAN>",of); |
407 |
spans--; |
408 |
} |
409 |
} else { |
410 |
fputs("<SPAN STYLE=\"", of); |
411 |
fput_character_layout(of, cur_char, inl->layout, wf); |
412 |
fputs("\">",of); |
413 |
layout_stack[spans++] = cur_char; |
414 |
} |
415 |
cur_char = inl->layout; |
416 |
} |
417 |
fput_text(of, ¶->text[loc], inl->length, &wasspace); |
418 |
loc += inl->length; |
419 |
} |
420 |
|
421 |
while (spans > 0) { |
422 |
fputs("</SPAN>",of); |
423 |
spans--; |
424 |
} |
425 |
|
426 |
if (loc < strlen(para->text)) { |
427 |
fput_text(of, ¶->text[loc], strlen(para->text) - loc, &wasspace); |
428 |
} |
429 |
|
430 |
if (strlen(para->text) == 0) |
431 |
fputs(" ", of); |
432 |
|
433 |
fputs("</P>\n", of); |
434 |
free(layout_stack); |
435 |
} |
436 |
|
437 |
static void fput_style(FILE * of, |
438 |
const psiconv_word_style normal, |
439 |
const psiconv_word_style sty, |
440 |
psiconv_word_f wf) |
441 |
{ |
442 |
if (sty->name == NULL) |
443 |
fputs(" P {", of); |
444 |
else { |
445 |
fputs(" P.", of); |
446 |
fput_name(of, sty->name); |
447 |
fputs(" {", of); |
448 |
} |
449 |
fput_paragraph_layout(of, normal ? normal->paragraph : NULL, sty->paragraph); |
450 |
fput_character_layout(of, normal ? normal->character : NULL, sty->character, wf); |
451 |
fputs("}\n", of); |
452 |
} |
453 |
|
454 |
static int psiconv_gen_html4(const char *filename, const psiconv_file file, |
455 |
const char *dest) |
456 |
{ |
457 |
FILE * of; |
458 |
int i; |
459 |
psiconv_paragraph para; |
460 |
psiconv_word_style normal, sty; |
461 |
psiconv_word_f wf; |
462 |
|
463 |
if (file->type == psiconv_word_file) |
464 |
wf = file->file; |
465 |
else { |
466 |
/* Fall back on the normal HTML generator */ |
467 |
return psiconv_gen_html(filename,file,dest); |
468 |
} |
469 |
|
470 |
if (! (of = fopen(filename,"w"))) |
471 |
return -1; |
472 |
|
473 |
fputs("<!doctype html public \"-//W3C//DTD HTML 4.0 STRICT//EN\">", of); |
474 |
fputs("\n<HTML>\n<HEAD>\n <META NAME=\"GENERATOR\"", of); |
475 |
fputs(" CONTENT=\"psiconv-" VERSION "\">\n", of); |
476 |
|
477 |
if (wf->page_sec->header->text) { |
478 |
if (psiconv_list_length(wf->page_sec->header->text->paragraphs) > 0) { |
479 |
fputs(" <TITLE>", of); |
480 |
para = psiconv_list_get(wf->page_sec->header->text->paragraphs, 0); |
481 |
i = 0; |
482 |
fput_text(of, para->text, strlen(para->text), &i); |
483 |
fputs("</TITLE>\n", of); |
484 |
} |
485 |
} |
486 |
|
487 |
normal = wf->styles_sec->normal; |
488 |
fputs(" <STYLE TYPE=\"text/css\"><!--\n", of); |
489 |
fprintf(of," BODY { background-color: #%02x%02x%02x }\n", |
490 |
normal->paragraph->back_color->red, |
491 |
normal->paragraph->back_color->green, |
492 |
normal->paragraph->back_color->blue); |
493 |
fput_style(of, NULL, normal, wf); |
494 |
for (i = 0; i < psiconv_list_length(wf->styles_sec->styles); i++) { |
495 |
sty = psiconv_list_get(wf->styles_sec->styles, i); |
496 |
fput_style(of, normal, sty, wf); |
497 |
} |
498 |
fputs(" --></STYLE>\n</HEAD>\n<BODY>\n", of); |
499 |
if (wf->page_sec->header->text) { |
500 |
for (i = 0; i < psiconv_list_length(wf->paragraphs); i++) { |
501 |
para = psiconv_list_get(wf->paragraphs, i); |
502 |
fput_para(of, para, wf); |
503 |
} |
504 |
} |
505 |
fputs("</BODY>\n</HTML>\n", of); |
506 |
|
507 |
return fclose(of); |
508 |
} |
509 |
|
510 |
static struct psiconv_fileformat_s ff = |
511 |
{ |
512 |
"HTML4", |
513 |
"HTML 4.0 with cascading style sheets", |
514 |
psiconv_gen_html4 |
515 |
}; |
516 |
|
517 |
void init_html4(void) |
518 |
{ |
519 |
psiconv_list_add(fileformat_list,&ff); |
520 |
} |
521 |
|