/[public]/psiconv/trunk/program/psiconv/gen_html.c
ViewVC logotype

Diff of /psiconv/trunk/program/psiconv/gen_html.c

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

Revision 20 Revision 147
14 14
15 You should have received a copy of the GNU General Public License 15 You should have received a copy of the GNU General Public License
16 along with this program; if not, write to the Free Software 16 along with this program; if not, write to the Free Software
17 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. 17 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
18*/ 18*/
19/*
20 2002/Apr. Keita KAWABE
21 A: <META HTTP-EQUIV="Content-Type" CONTENT="text/html"> header
22 was added.
23
24 B: Support for narrow build Asian Psions added.
25 If the encoding_type is PSICONV_ENCODING_UTF8,
26 B-1: use utf8_table for character conversion.
27 B-2: add the "Charset=UTF-8" in the Content-Type header.
28 Otherwise proceed as normal.
29*/
19 30
20#include "config.h" 31#include "config.h"
21#include <stdio.h> 32#include <stdio.h>
22#include <string.h> 33#include <string.h>
23#include <stdlib.h> 34#include <stdlib.h>
24#include "data.h" 35#include "psiconv/data.h"
25#include "list.h" 36#include "psiconv/list.h"
26#include "gen.h" 37#include "gen.h"
38#include "psiconv.h"
39
40#ifdef DMALLOC
41#include "dmalloc.h"
42#endif
27 43
28/* This determines for each character how it is displayed */ 44/* This determines for each character how it is displayed */
29static const char *char_table[0x100] = 45static const char *char_table[0x100] =
30{ 46{
31 /* 0x00 */ "" ,"" ,"" ,"" ,"" ,"" ,"<P> ","<BR>" , 47 /* 0x00 */ "" ,"" ,"" ,"" ,"" ,"" ,"<P> ","<BR>" ,
73 "&ocirc;","&otilde;","&ouml;","&divide;", 89 "&ocirc;","&otilde;","&ouml;","&divide;",
74 /* 0xf8 */ "&oslash;","&ugrave;","&uacute;","&ucirc;", 90 /* 0xf8 */ "&oslash;","&ugrave;","&uacute;","&ucirc;",
75 "&uuml;","&yacute;","&thorn;","&yuml;" 91 "&uuml;","&yacute;","&thorn;","&yuml;"
76}; 92};
77 93
94static const char *utf_table[0x100] =
95{
96 /* 0x00 */ "" ,"" ,"" ,"" ,"" ,"" ,"<P> ","<BR>" ,
97 /* 0x08 */ "<P>" ," " ,"" ,"" ,"" ,"" ,"" ,"" ,
98 /* 0x10 */ " " ,"" ,"" ,"" ,"" ,"" ,"" ,"" ,
99 /* 0x18 */ "" ,"" ,"" ,"" ,"" ,"" ,"" ,"" ,
100 /* 0x20 */ " " ,"!" ,"&quot;","#" ,"$" ,"%" ,"&amp;","'" ,
101 /* 0x28 */ "(" ,")" ,"*" ,"+" ,"," ,"-" ,"." ,"/" ,
102 /* 0x30 */ "0" ,"1" ,"2" ,"3" ,"4" ,"5" ,"6" ,"7" ,
103 /* 0x38 */ "8" ,"9" ,":" ,";" ,"&lt;" ,"=" ,"&gt;" ,"?" ,
104 /* 0x40 */ "@" ,"A" ,"B" ,"C" ,"D" ,"E" ,"F" ,"G" ,
105 /* 0x48 */ "H" ,"I" ,"J" ,"K" ,"L" ,"M" ,"N" ,"O" ,
106 /* 0x50 */ "P" ,"Q" ,"R" ,"S" ,"T" ,"U" ,"V" ,"W" ,
107 /* 0x58 */ "X" ,"Y" ,"Z" ,"[" ,"\\" ,"]" ,"^" ,"_" ,
108 /* 0x60 */ "`" ,"a" ,"b" ,"c" ,"d" ,"e" ,"f" ,"g" ,
109 /* 0x68 */ "h" ,"i" ,"j" ,"k" ,"l" ,"m" ,"n" ,"o" ,
110 /* 0x70 */ "p" ,"q" ,"r" ,"s" ,"t" ,"u" ,"v" ,"w" ,
111 /* 0x78 */ "x" ,"y" ,"z" ,"{" ,"|" ,"}" ,"~" ,"" ,
112 /* 0x80 */ "\x80", "\x81", "\x82", "\x83", "\x84", "\x85", "\x86", "\x87",
113 /* 0x88 */ "\x88", "\x89", "\x8a", "\x8b", "\x8c", "\x8d", "\x8e", "\x8f",
114 /* 0x90 */ "\x90", "\x91", "\x92", "\x93", "\x94", "\x95", "\x96", "\x97",
115 /* 0x98 */ "\x98", "\x99", "\x9a", "\x9b", "\x9c", "\x9d", "\x9e", "\x9f",
116 /* 0xa0 */ "\xa0", "\xa1", "\xa2", "\xa3", "\xa4", "\xa5", "\xa6", "\xa7",
117 /* 0xa8 */ "\xa8", "\xa9", "\xaa", "\xab", "\xac", "\xad", "\xae", "\xaf",
118 /* 0xb0 */ "\xb0", "\xb1", "\xb2", "\xb3", "\xb4", "\xb5", "\xb6", "\xb7",
119 /* 0xb8 */ "\xb8", "\xb9", "\xba", "\xbb", "\xbc", "\xbd", "\xbe", "\xbf",
120 /* 0xc0 */ "\xc0", "\xc1", "\xc2", "\xc3", "\xc4", "\xc5", "\xc6", "\xc7",
121 /* 0xc8 */ "\xc8", "\xc9", "\xca", "\xcb", "\xcc", "\xcd", "\xce", "\xcf",
122 /* 0xd0 */ "\xd0", "\xd1", "\xd2", "\xd3", "\xd4", "\xd5", "\xd6", "\xd7",
123 /* 0xd8 */ "\xd8", "\xd9", "\xda", "\xdb", "\xdc", "\xdd", "\xde", "\xdf",
124 /* 0xe0 */ "\xe0", "\xe1", "\xe2", "\xe3", "\xe4", "\xe5", "\xe6", "\xe7",
125 /* 0xe8 */ "\xe8", "\xe9", "\xea", "\xeb", "\xec", "\xed", "\xee", "\xef",
126 /* 0xf0 */ "\xf0", "\xf1", "\xf2", "\xf3", "\xf4", "\xf5", "\xf6", "\xf7",
127 /* 0xf8 */ "\xf8", "\xf9", "\xfa", "\xfb", "\xfc", "\xfd", "\xfe", "\xff",
128};
129
130/* a flag to indicate the use of UTF8 */
131static psiconv_encoding encoding= PSICONV_ENCODING_CP1252;
132
78static psiconv_character_layout gen_base_char(const psiconv_font font, 133static psiconv_character_layout gen_base_char(const psiconv_font font,
79 const psiconv_color color, 134 const psiconv_color color,
80 const psiconv_color back_color); 135 const psiconv_color back_color);
81static void diff_char(FILE *of, const psiconv_character_layout old, 136static void diff_char(FILE *of, const psiconv_character_layout old,
82 const psiconv_character_layout new, int *flags); 137 const psiconv_character_layout new, int *flags);
90 This one is specific for the base point of HTML */ 145 This one is specific for the base point of HTML */
91psiconv_character_layout gen_base_char(const psiconv_font font, 146psiconv_character_layout gen_base_char(const psiconv_font font,
92 const psiconv_color color, 147 const psiconv_color color,
93 const psiconv_color back_color) 148 const psiconv_color back_color)
94{ 149{
95 struct psiconv_character_layout base_char_struct = 150 struct psiconv_character_layout_s base_char_struct =
96 { 151 {
97 NULL, /* color */ 152 NULL, /* color */
98 NULL, /* back_color */ 153 NULL, /* back_color */
99 13.0, /* font_size */ 154 13.0, /* font_size */
100 psiconv_bool_false, /* italic */ 155 psiconv_bool_false, /* italic */
101 psiconv_bool_false, /* bold */ 156 psiconv_bool_false, /* bold */
102 psiconv_normalscript, /* super_sub */ 157 psiconv_normalscript, /* super_sub */
103 psiconv_bool_false, /* underline */ 158 psiconv_bool_false, /* underline */
104 psiconv_bool_false, /* strike_out */ 159 psiconv_bool_false, /* strikethrough */
105 NULL, /* font */ 160 NULL, /* font */
106 }; 161 };
107 base_char_struct.color = color; 162 base_char_struct.color = color;
108 base_char_struct.back_color = back_color; 163 base_char_struct.back_color = back_color;
109 base_char_struct.font = font; 164 base_char_struct.font = font;
130 fputs("</I>",of); 185 fputs("</I>",of);
131 if (old->bold) 186 if (old->bold)
132 fputs("</B>",of); 187 fputs("</B>",of);
133 if (old->underline) 188 if (old->underline)
134 fputs("</U>",of); 189 fputs("</U>",of);
135 if (old->strike_out) 190 if (old->strikethrough)
136 fputs("</STRIKE>",of); 191 fputs("</STRIKE>",of);
137 if (old->super_sub == psiconv_superscript) 192 if (old->super_sub == psiconv_superscript)
138 fputs("</SUP>",of); 193 fputs("</SUP>",of);
139 if (old->super_sub == psiconv_subscript) 194 if (old->super_sub == psiconv_subscript)
140 fputs("</SUB>",of); 195 fputs("</SUB>",of);
157 fputs("6",of); 212 fputs("6",of);
158 else 213 else
159 fputs("7",of); 214 fputs("7",of);
160 fprintf(of," COLOR=#%02x%02x%02x",new->color->red,new->color->green, 215 fprintf(of," COLOR=#%02x%02x%02x",new->color->red,new->color->green,
161 new->color->blue); 216 new->color->blue);
162 if (new->font->screenfont == 1) 217 if (new->font->screenfont == psiconv_font_sansserif)
163 fprintf(of," FACE=\"%s, Sans-Serif\">",new->font->name); 218 fprintf(of," FACE=\"%s, Sans-Serif\">",new->font->name);
164 else if (new->font->screenfont == 2) 219 else if (new->font->screenfont == psiconv_font_nonprop)
165 fprintf(of," FACE=\"%s, Monospace\">",new->font-> name); 220 fprintf(of," FACE=\"%s, Monospace\">",new->font-> name);
166 else if (new->font->screenfont == 3) 221 else if (new->font->screenfont == psiconv_font_serif)
167 fprintf(of," FACE=\"%s, Serif\">",new->font-> name); 222 fprintf(of," FACE=\"%s, Serif\">",new->font-> name);
168 else 223 else
169 fprintf(of," FACE=\"%s, Serif\">",new->font-> name); 224 fprintf(of," FACE=\"%s, Serif\">",new->font-> name);
170 } 225 }
171 if (new->italic) 226 if (new->italic)
172 fputs("<I>",of); 227 fputs("<I>",of);
173 if (new->bold) 228 if (new->bold)
174 fputs("<B>",of); 229 fputs("<B>",of);
175 if (new->underline) 230 if (new->underline)
176 fputs("<U>",of); 231 fputs("<U>",of);
177 if (new->strike_out) 232 if (new->strikethrough)
178 fputs("<STRIKE>",of); 233 fputs("<STRIKE>",of);
179 if (new->super_sub == psiconv_superscript) 234 if (new->super_sub == psiconv_superscript)
180 fputs("<SUP>",of); 235 fputs("<SUP>",of);
181 if (new->super_sub == psiconv_subscript) 236 if (new->super_sub == psiconv_subscript)
182 fputs("<SUB>",of); 237 fputs("<SUB>",of);
197 if (old->underline) 252 if (old->underline)
198 fputs("</U>",of); 253 fputs("</U>",of);
199 else 254 else
200 fputs("<U>",of); 255 fputs("<U>",of);
201 } 256 }
202 if (old->strike_out != new->strike_out) { 257 if (old->strikethrough != new->strikethrough) {
203 if (old->strike_out) 258 if (old->strikethrough)
204 fputs("</STRIKE>",of); 259 fputs("</STRIKE>",of);
205 else 260 else
206 fputs("<STRIKE>",of); 261 fputs("<STRIKE>",of);
207 } 262 }
208 if (old->super_sub != new->super_sub) { 263 if (old->super_sub != new->super_sub) {
223{ 278{
224 int i,j,loc; 279 int i,j,loc;
225 psiconv_character_layout cur_char; 280 psiconv_character_layout cur_char;
226 psiconv_in_line_layout inl; 281 psiconv_in_line_layout inl;
227 int flags = 0; 282 int flags = 0;
283
284 char **table;
285 if (encoding == PSICONV_ENCODING_UTF8){
286 table=(char**)utf_table;
287 }else{
288 table=(char**)char_table;
289 }
290
228 291
229 292
230 fputs("<P",of); 293 fputs("<P",of);
231 if (para->base_paragraph->justify_hor == psiconv_justify_left) 294 if (para->base_paragraph->justify_hor == psiconv_justify_left)
232 fputs(" ALIGN=left",of); 295 fputs(" ALIGN=left",of);
251 for (i = 0; i < psiconv_list_length(para->in_lines); i++) { 314 for (i = 0; i < psiconv_list_length(para->in_lines); i++) {
252 inl = psiconv_list_get(para->in_lines,i); 315 inl = psiconv_list_get(para->in_lines,i);
253 diff_char(of,cur_char,inl->layout,&flags); 316 diff_char(of,cur_char,inl->layout,&flags);
254 cur_char = inl->layout; 317 cur_char = inl->layout;
255 for (j = loc; j < inl->length + loc; j ++) { 318 for (j = loc; j < inl->length + loc; j ++) {
256 fputs(char_table[(unsigned char) (para->text[j])],of); 319 fputs(table[(unsigned char) (para->text[j])],of);
257 } 320 }
258 loc = j; 321 loc = j;
259 } 322 }
260 323
261 if (loc < strlen(para->text)) { 324 if (loc < strlen(para->text)) {
262 diff_char(of,cur_char,para->base_character,&flags); 325 diff_char(of,cur_char,para->base_character,&flags);
263 cur_char = para->base_character; 326 cur_char = para->base_character;
264 for (j = loc; j < strlen(para->text); j ++) { 327 for (j = loc; j < strlen(para->text); j ++) {
265 fputs(char_table[(unsigned char) (para->text[j])],of); 328 fputs(table[(unsigned char) (para->text[j])],of);
266 } 329 }
267 } 330 }
268 331
269 if (strlen(para->text) == 0) 332 if (strlen(para->text) == 0)
270 fputs("<BR>",of); 333 fputs("<BR>",of);
276 fputs("</UL>",of); 339 fputs("</UL>",of);
277 340
278 fputs("</P>\n",of); 341 fputs("</P>\n",of);
279} 342}
280 343
281void psiconv_gen_html(FILE *of,psiconv_file file) 344int psiconv_gen_html(const char * filename,const psiconv_file file,
345 const char *dest, const psiconv_encoding encoding_type)
282{ 346{
347 FILE *of = fopen(filename,"w");
348 if (! of)
349 return -1;
350
351 encoding = encoding_type;
352
283 if (file->type == psiconv_word_file) 353 if (file->type == psiconv_word_file) {
284 psiconv_gen_html_word(of,(psiconv_word_f) file->file); 354 psiconv_gen_html_word(of,(psiconv_word_f) file->file);
285 else if (file->type == psiconv_texted_file) 355 } else if (file->type == psiconv_texted_file) {
286 psiconv_gen_html_texted(of,(psiconv_texted_f) file->file); 356 psiconv_gen_html_texted(of,(psiconv_texted_f) file->file);
287 else 357 } else {
358 fclose(of);
288 return; 359 return -1;
360 }
361 return fclose(of);
289} 362}
290 363
291void psiconv_gen_html_texted(FILE *of,psiconv_texted_f tf) 364void psiconv_gen_html_texted(FILE *of,psiconv_texted_f tf)
292{ 365{
293 psiconv_character_layout base_char; 366 psiconv_character_layout base_char;
298 base_char = psiconv_basic_character_layout(); 371 base_char = psiconv_basic_character_layout();
299 372
300 fputs("<!doctype html public \"-//W3C//DTD HTML 3.2 Final//EN\">", of); 373 fputs("<!doctype html public \"-//W3C//DTD HTML 3.2 Final//EN\">", of);
301 fputs("\n<HTML>\n<HEAD>\n <META NAME=\"GENERATOR\"", of); 374 fputs("\n<HTML>\n<HEAD>\n <META NAME=\"GENERATOR\"", of);
302 fputs(" CONTENT=\"psiconv-" VERSION "\">\n", of); 375 fputs(" CONTENT=\"psiconv-" VERSION "\">\n", of);
376
377 fputs(" <META HTTP-EQUIV=\"Content-Type\" CONTENT=\"text/html", of);
378 if (encoding == PSICONV_ENCODING_UTF8){
379 fputs("; CHARSET=UTF-8", of);
380 }
381 fputs("\">\n", of);
382
383 fputs("</HEAD>\n",of);
303 fputs("<BODY>\n",of); 384 fputs("<BODY>\n",of);
304 for (i = 0; i < psiconv_list_length(tf->texted_sec->paragraphs); i++) { 385 for (i = 0; i < psiconv_list_length(tf->texted_sec->paragraphs); i++) {
305 para = psiconv_list_get(tf->texted_sec->paragraphs,i); 386 para = psiconv_list_get(tf->texted_sec->paragraphs,i);
306 gen_para(of,para,base_char); 387 gen_para(of,para,base_char);
307 } 388 }
334 psiconv_free_color(white); 415 psiconv_free_color(white);
335 416
336 fputs("<!doctype html public \"-//W3C//DTD HTML 3.2 Final//EN\">", of); 417 fputs("<!doctype html public \"-//W3C//DTD HTML 3.2 Final//EN\">", of);
337 fputs("\n<HTML>\n<HEAD>\n <META NAME=\"GENERATOR\"", of); 418 fputs("\n<HTML>\n<HEAD>\n <META NAME=\"GENERATOR\"", of);
338 fputs(" CONTENT=\"psiconv-" VERSION "\">\n", of); 419 fputs(" CONTENT=\"psiconv-" VERSION "\">\n", of);
420
421 fputs(" <META HTTP-EQUIV=\"Content-Type\" CONTENT=\"text/html", of);
422 if (encoding == PSICONV_ENCODING_UTF8)
423 fputs("; CHARSET=UTF-8", of);
424 fputs("\">\n", of);
425
426 fputs("</HEAD>\n",of);
339 fputs("<BODY>\n",of); 427 fputs("<BODY>\n",of);
340 428
341 for (i = 0; i < psiconv_list_length(wf->paragraphs); i++) { 429 for (i = 0; i < psiconv_list_length(wf->paragraphs); i++) {
342 para = psiconv_list_get(wf->paragraphs,i); 430 para = psiconv_list_get(wf->paragraphs,i);
343 gen_para(of,para,base_char); 431 gen_para(of,para,base_char);
344 } 432 }
345 fputs("</BODY>\n</HTML>\n",of); 433 fputs("</BODY>\n</HTML>\n",of);
346 psiconv_free_character_layout(base_char); 434 psiconv_free_character_layout(base_char);
347} 435}
348 436
437static struct psiconv_fileformat_s ff =
438 {
439 "HTML3",
440 "HTML 3.2, not verified so probably not completely compliant",
441 &psiconv_gen_html
442 };
349 443
444void init_html(void)
445{
446 psiconv_list_add(fileformat_list,&ff);
447}

Legend:
Removed from v.20  
changed lines
  Added in v.147

frodo@frodo.looijaard.name
ViewVC Help
Powered by ViewVC 1.1.26