/[public]/psiconv/trunk/program/psiconv/gen_txt.c
ViewVC logotype

Diff of /psiconv/trunk/program/psiconv/gen_txt.c

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

Revision 142 Revision 185
1/* 1/*
2 * gen_text.c - Part of psiconv, a PSION 5 file formats converter 2 * gen_text.c - Part of psiconv, a PSION 5 file formats converter
3 * Copyright (c) 1999 Andrew Johnson <anjohnson@iee.org> 3 * Copyright (c) 1999 Andrew Johnson <anjohnson@iee.org>
4 * Portions Copyright (c) 1999 Frodo Looijaard <frodol@dds.nl> 4 * Portions Copyright (c) 1999,2003 Frodo Looijaard <frodol@dds.nl>
5 * 5 *
6 * This program is free software; you can redistribute it and/or modify 6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by 7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or 8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version. 9 * (at your option) any later version.
19 */ 19 */
20 20
21#include "config.h" 21#include "config.h"
22#include <stdio.h> 22#include <stdio.h>
23#include <string.h> 23#include <string.h>
24#include "psiconv/data.h" 24#include <psiconv/data.h>
25#include "psiconv/list.h" 25#include <psiconv/list.h>
26#include <psiconv/unicode.h>
27#include "general.h"
26#include "gen.h" 28#include "gen.h"
27#include "psiconv.h" 29#include "psiconv.h"
28 30
29#ifdef DMALLOC 31#ifdef DMALLOC
30#include "dmalloc.h" 32#include "dmalloc.h"
31#endif 33#endif
32 34
35static void output_para(const psiconv_config config,psiconv_list list,
36 const psiconv_paragraph para,encoding encoding_type);
37static void gen_txt_word(const psiconv_config config, psiconv_list list,
38 psiconv_word_f wf, encoding encoding_type);
39static void gen_txt_texted(const psiconv_config config, psiconv_list list,
40 psiconv_texted_f tf, encoding encoding_type);
41static int gen_txt(const psiconv_config config, psiconv_list list,
42 const psiconv_file file, const char *dest,
43 const encoding encoding_type);
33 44
34/*
35 * Various string tables for HTML4 settings
36 */
37
38/* Character conversion table */
39static const char *char_table[0x100] = {
40 /* 0x00 */ "", "", "", "", "", "", "\n", "\n",
41 /* 0x08 */ "\n", "\t", "", "", "", "", "", "",
42 /* 0x10 */ " ", "", "", "", "", "", "", "",
43 /* 0x18 */ "", "", "", "", "", "", "", "",
44 /* 0x20 */ " ", "!", "\"", "#", "$", "%", "&", "'",
45 /* 0x28 */ "(", ")", "*", "+", ",", "-", ".", "/",
46 /* 0x30 */ "0", "1", "2", "3", "4", "5", "6", "7",
47 /* 0x38 */ "8", "9", ":", ";", "<", "=", ">", "?",
48 /* 0x40 */ "@", "A", "B", "C", "D", "E", "F", "G",
49 /* 0x48 */ "H", "I", "J", "K", "L", "M", "N", "O",
50 /* 0x50 */ "P", "Q", "R", "S", "T", "U", "V", "W",
51 /* 0x58 */ "X", "Y", "Z", "[", "\\", "]", "^", "_",
52 /* 0x60 */ "`", "a", "b", "c", "d", "e", "f", "g",
53 /* 0x68 */ "h", "i", "j", "k", "l", "m", "n", "o",
54 /* 0x70 */ "p", "q", "r", "s", "t", "u", "v", "w",
55 /* 0x78 */ "x", "y", "z", "{", "|", "}", "~", "",
56 /* 0x80 */ "", "", ",", "f", ",,", "...", "+", "#",
57 /* 0x88 */ "^", "\176/oo","S", "<", "OE", "", "", "",
58 /* 0x90 */ "", "`", "'", "``", "''", "*", "-", "--",
59 /* 0x98 */ "~", "(TM)", "s", ">", "oe", "", "", "Y",
60 /* 0xa0 */ "\xa0", "\xa1", "\xa2", "\xa3", "\xa4", "\xa5", "\xa6", "\xa7",
61 /* 0xa8 */ "\xa8", "\xa9", "\xaa", "\xab", "\xac", "\xad", "\xae", "\xaf",
62 /* 0xb0 */ "\xb0", "\xb1", "\xb2", "\xb3", "\xb4", "\xb5", "\xb6", "\xb7",
63 /* 0xb8 */ "\xb8", "\xb9", "\xba", "\xbb", "\xbc", "\xbd", "\xbe", "\xbf",
64 /* 0xc0 */ "\xc0", "\xc1", "\xc2", "\xc3", "\xc4", "\xc5", "\xc6", "\xc7",
65 /* 0xc8 */ "\xc8", "\xc9", "\xca", "\xcb", "\xcc", "\xcd", "\xce", "\xcf",
66 /* 0xd0 */ "\xd0", "\xd1", "\xd2", "\xd3", "\xd4", "\xd5", "\xd6", "\xd7",
67 /* 0xd8 */ "\xd8", "\xd9", "\xda", "\xdb", "\xdc", "\xdd", "\xde", "\xdf",
68 /* 0xe0 */ "\xe0", "\xe1", "\xe2", "\xe3", "\xe4", "\xe5", "\xe6", "\xe7",
69 /* 0xe8 */ "\xe8", "\xe9", "\xea", "\xeb", "\xec", "\xed", "\xee", "\xef",
70 /* 0xf0 */ "\xf0", "\xf1", "\xf2", "\xf3", "\xf4", "\xf5", "\xf6", "\xf7",
71 /* 0xf8 */ "\xf8", "\xf9", "\xfa", "\xfb", "\xfc", "\xfd", "\xfe", "\xff",
72};
73
74
75/* Output a string, doing character conversions */
76static void fput_text(FILE * of, const char *text, int length) {
77 int j;
78
79 for (j = 0; j < length; j++) {
80 fputs(char_table[(unsigned char) (text[j])], of);
81 }
82}
83
84
85/* Output a paragraph */
86static void fput_para(FILE * of,
87 const psiconv_paragraph para,int extra_nl)
88{
89 if (para->base_paragraph->bullet->on) {
90 fprintf(of, "%s ", char_table[para->base_paragraph->bullet->character]);
91 }
92 fput_text(of, para->text, strlen(para->text));
93 fputs("\n", of);
94 if (extra_nl)
95 fputs("\n", of);
96}
97
98static void psiconv_gen_txt_texted(FILE * of, psiconv_texted_f tf)
99{
100 int i;
101 psiconv_paragraph para;
102
103 if (tf->page_sec->header->text) {
104 if (tf->page_sec->header->on_first_page) {
105 for (i=0; i < psiconv_list_length(tf->page_sec->header->text->paragraphs); i++) {
106 para = psiconv_list_get(tf->page_sec->header->text->paragraphs, i);
107 fput_text(of, para->text, strlen(para->text));
108 fputs("\n", of);
109 }
110 }
111 }
112 fputs("\n",of);
113
114 for (i=0; i < psiconv_list_length(tf->texted_sec->paragraphs); i++) {
115 para = psiconv_list_get(tf->texted_sec->paragraphs, i);
116 fput_para(of, para,0);
117 }
118
119 fputs("\n",of);
120 if (tf->page_sec->header->text) {
121 for (i=0; i < psiconv_list_length(tf->page_sec->footer->text->paragraphs); i++) {
122 para = psiconv_list_get(tf->page_sec->footer->text->paragraphs, i);
123 fput_text(of, para->text, strlen(para->text));
124 fputs("\n", of);
125 }
126 }
127}
128
129static void psiconv_gen_txt_word(FILE * of, psiconv_word_f wf)
130{
131 int i;
132 psiconv_paragraph para;
133
134 if (wf->page_sec->header->on_first_page) {
135 for (i=0; i < psiconv_list_length(wf->page_sec->header->text->paragraphs); i++) {
136 para = psiconv_list_get(wf->page_sec->header->text->paragraphs, i);
137 fput_text(of, para->text, strlen(para->text));
138 fputs("\n\n", of);
139 }
140 }
141 fputs("\n\n", of);
142
143 for (i=0; i < psiconv_list_length(wf->paragraphs); i++) {
144 para = psiconv_list_get(wf->paragraphs, i);
145 fput_para(of, para,1);
146 }
147
148 fputs("\n\n", of);
149 for (i=0; i < psiconv_list_length(wf->page_sec->footer->text->paragraphs); i++) {
150 para = psiconv_list_get(wf->page_sec->footer->text->paragraphs, i);
151 fput_text(of, para->text, strlen(para->text));
152 fputs("\n\n", of);
153 }
154}
155
156static int psiconv_gen_txt(const char *filename, const psiconv_file file,
157 const char *dest)
158{
159 FILE *of = fopen(filename,"w");
160 if (! of)
161 return -1;
162
163 if (file->type == psiconv_word_file) {
164 psiconv_gen_txt_word(of,(psiconv_word_f) file->file);
165 } else if (file->type == psiconv_texted_file) {
166 psiconv_gen_txt_texted(of,(psiconv_texted_f) file->file);
167 } else {
168 fclose(of);
169 return -1;
170 }
171 return fclose(of);
172}
173
174static struct psiconv_fileformat_s ff = 45static struct fileformat_s ff =
175 { 46 {
176 "ASCII", 47 "ASCII",
177 "Plain text without much layout", 48 "Plain text without much layout",
178 psiconv_gen_txt 49 gen_txt
179 }; 50 };
180 51
52
53void output_para(const psiconv_config config,psiconv_list list,
54 const psiconv_paragraph para,encoding encoding_type)
55{
56 int i;
57 if (para && para->base_paragraph && para->base_paragraph->bullet &&
58 para->base_paragraph->bullet->on) {
59 output_char(config,list,para->base_paragraph->bullet->character,
60 encoding_type);
61 output_char(config,list,' ', encoding_type);
62 output_char(config,list,' ', encoding_type);
63 output_char(config,list,' ', encoding_type);
64 }
65 if (para && para->text) {
66 for (i = 0; i < psiconv_unicode_strlen(para->text); i++)
67 switch (para->text[i]) {
68 case 0x06:
69 case 0x07:
70 case 0x08:
71 output_char(config,list,'\n',encoding_type);
72 break;
73 case 0x09:
74 case 0x0a:
75 output_char(config,list,'\t',encoding_type);
76 break;
77 case 0x0b:
78 case 0x0c:
79 output_char(config,list,'-',encoding_type);
80 break;
81 case 0x0f:
82 output_char(config,list,' ',encoding_type);
83 break;
84 case 0x00:
85 case 0x01:
86 case 0x02:
87 case 0x03:
88 case 0x04:
89 case 0x05:
90 case 0x0e:
91 case 0x10:
92 case 0x11:
93 case 0x12:
94 case 0x13:
95 case 0x14:
96 case 0x15:
97 case 0x16:
98 case 0x17:
99 case 0x18:
100 case 0x19:
101 case 0x1a:
102 case 0x1c:
103 case 0x1d:
104 case 0x1e:
105 case 0x1f:
106 break;
107 default:
108 output_char(config,list,para->text[i],encoding_type);
109 break;
110 }
111 output_char(config,list,'\n',encoding_type);
112 }
113}
114
115void gen_txt_word(const psiconv_config config, psiconv_list list,
116 psiconv_word_f wf, encoding encoding_type)
117{
118 int i;
119 psiconv_paragraph para;
120
121 if (wf && wf->page_sec && wf->page_sec->header &&
122 wf->page_sec->header->text && wf->page_sec->header->text->paragraphs) {
123 for (i=0;
124 i < psiconv_list_length(wf->page_sec->header->
125 text->paragraphs); i++) {
126 para = psiconv_list_get(wf->page_sec->header->text->paragraphs,
127 i);
128 output_para(config,list,para,encoding_type);
129 }
130 }
131 output_char(config,list,'\n',encoding_type);
132
133 if (wf && wf->paragraphs)
134 for (i=0; i < psiconv_list_length(wf->paragraphs); i++) {
135 para = psiconv_list_get(wf->paragraphs, i);
136 output_para(config, list,para,encoding_type);
137 }
138
139 output_char(config,list,'\n',encoding_type);
140
141 if (wf && wf->page_sec && wf->page_sec->footer &&
142 wf->page_sec->footer->text && wf->page_sec->footer->text->paragraphs) {
143 for (i=0;
144 i < psiconv_list_length(wf->page_sec->footer->
145 text->paragraphs); i++) {
146 para = psiconv_list_get(wf->page_sec->footer->text->paragraphs, i);
147 output_para(config,list,para,encoding_type);
148 }
149 }
150}
151
152void gen_txt_texted(const psiconv_config config, psiconv_list list,
153 psiconv_texted_f tf, encoding encoding_type)
154{
155 int i;
156 psiconv_paragraph para;
157
158 if (tf && tf->page_sec && tf->page_sec->header &&
159 tf->page_sec->header->text && tf->page_sec->header->text->paragraphs) {
160 for (i=0;
161 i < psiconv_list_length(tf->page_sec->header->
162 text->paragraphs); i++) {
163 para = psiconv_list_get(tf->page_sec->header->text->paragraphs,
164 i);
165 output_para(config,list,para,encoding_type);
166 }
167 }
168 output_char(config,list,'\n',encoding_type);
169
170 if (tf && tf->texted_sec && tf->texted_sec->paragraphs)
171 for (i=0; i < psiconv_list_length(tf->texted_sec->paragraphs); i++) {
172 para = psiconv_list_get(tf->texted_sec->paragraphs, i);
173 output_para(config, list,para,encoding_type);
174 }
175
176 output_char(config,list,'\n',encoding_type);
177
178 if (tf && tf->page_sec && tf->page_sec->footer &&
179 tf->page_sec->footer->text && tf->page_sec->footer->text->paragraphs) {
180 for (i=0;
181 i < psiconv_list_length(tf->page_sec->footer->
182 text->paragraphs); i++) {
183 para = psiconv_list_get(tf->page_sec->footer->text->paragraphs, i);
184 output_para(config,list,para,encoding_type);
185 }
186 }
187}
188
189int gen_txt(const psiconv_config config, psiconv_list list,
190 const psiconv_file file, const char *dest,
191 const encoding encoding_type)
192{
193 if (file->type == psiconv_word_file) {
194 gen_txt_word(config,list,(psiconv_word_f) file->file,encoding_type);
195 return 0;
196 } else if (file->type == psiconv_texted_file) {
197 gen_txt_texted(config,list,(psiconv_texted_f) file->file,encoding_type);
198 return 0;
199 } else
200 return -1;
201}
202
181void init_txt(void) 203void init_txt(void)
182{ 204{
183 psiconv_list_add(fileformat_list,&ff); 205 psiconv_list_add(fileformat_list,&ff);
184} 206}
185 207

Legend:
Removed from v.142  
changed lines
  Added in v.185

frodo@frodo.looijaard.name
ViewVC Help
Powered by ViewVC 1.1.26