1 | /* |
---|
2 | * man2tcl.c -- |
---|
3 | * |
---|
4 | * This file contains a program that turns a man page of the form used |
---|
5 | * for Tcl and Tk into a Tcl script that invokes a Tcl command for each |
---|
6 | * construct in the man page. The script can then be eval'ed to translate |
---|
7 | * the manual entry into some other format such as MIF or HTML. |
---|
8 | * |
---|
9 | * Usage: |
---|
10 | * |
---|
11 | * man2tcl ?fileName? |
---|
12 | * |
---|
13 | * Copyright (c) 1995 Sun Microsystems, Inc. |
---|
14 | * |
---|
15 | * See the file "license.terms" for information on usage and redistribution of |
---|
16 | * this file, and for a DISCLAIMER OF ALL WARRANTIES. |
---|
17 | * |
---|
18 | * RCS: @(#) $Id: man2tcl.c,v 1.13 2007/12/13 15:28:40 dgp Exp $ |
---|
19 | */ |
---|
20 | |
---|
21 | static char sccsid[] = "@(#) man2tcl.c 1.3 95/08/12 17:34:08"; |
---|
22 | |
---|
23 | #include <stdio.h> |
---|
24 | #include <stdlib.h> |
---|
25 | #include <string.h> |
---|
26 | #include <ctype.h> |
---|
27 | #include <errno.h> |
---|
28 | |
---|
29 | /* |
---|
30 | * Imported things that aren't defined in header files: |
---|
31 | */ |
---|
32 | |
---|
33 | /* |
---|
34 | * Some <errno.h> define errno to be something complex and thread-aware; in |
---|
35 | * that case we definitely do not want to declare errno ourselves! |
---|
36 | */ |
---|
37 | |
---|
38 | #ifndef errno |
---|
39 | extern int errno; |
---|
40 | #endif |
---|
41 | |
---|
42 | /* |
---|
43 | * Current line number, used for error messages. |
---|
44 | */ |
---|
45 | |
---|
46 | static int lineNumber; |
---|
47 | |
---|
48 | /* |
---|
49 | * The variable below is set to 1 if an error occurs anywhere while reading in |
---|
50 | * the file. |
---|
51 | */ |
---|
52 | |
---|
53 | static int status; |
---|
54 | |
---|
55 | /* |
---|
56 | * The variable below is set to 1 if output should be generated. If it's 0, it |
---|
57 | * means we're doing a pre-pass to make sure that the file can be properly |
---|
58 | * parsed. |
---|
59 | */ |
---|
60 | |
---|
61 | static int writeOutput; |
---|
62 | |
---|
63 | #define PRINT(args) if (writeOutput) { printf args; } |
---|
64 | #define PRINTC(chr) if (writeOutput) { putc((chr), stdout); } |
---|
65 | |
---|
66 | /* |
---|
67 | * Prototypes for functions defined in this file: |
---|
68 | */ |
---|
69 | |
---|
70 | static void DoMacro(char *line); |
---|
71 | static void DoText(char *line); |
---|
72 | static void QuoteText(char *string, int count); |
---|
73 | |
---|
74 | /* |
---|
75 | *---------------------------------------------------------------------- |
---|
76 | * |
---|
77 | * main -- |
---|
78 | * |
---|
79 | * This function is the main program, which does all of the work of the |
---|
80 | * program. |
---|
81 | * |
---|
82 | * Results: |
---|
83 | * None: exits with a 0 return status to indicate success, or 1 to |
---|
84 | * indicate that there were problems in the translation. |
---|
85 | * |
---|
86 | * Side effects: |
---|
87 | * A Tcl script is output to standard output. Error messages may be |
---|
88 | * output on standard error. |
---|
89 | * |
---|
90 | *---------------------------------------------------------------------- |
---|
91 | */ |
---|
92 | |
---|
93 | int |
---|
94 | main( |
---|
95 | int argc, /* Number of command-line arguments. */ |
---|
96 | char **argv) /* Values of command-line arguments. */ |
---|
97 | { |
---|
98 | FILE *f; |
---|
99 | #define MAX_LINE_SIZE 1000 |
---|
100 | char line[MAX_LINE_SIZE]; |
---|
101 | char *p; |
---|
102 | |
---|
103 | /* |
---|
104 | * Find the file to read, and open it if it isn't stdin. |
---|
105 | */ |
---|
106 | |
---|
107 | if (argc == 1) { |
---|
108 | f = stdin; |
---|
109 | } else if (argc == 2) { |
---|
110 | f = fopen(argv[1], "r"); |
---|
111 | if (f == NULL) { |
---|
112 | fprintf(stderr, "Couldn't read \"%s\": %s\n", argv[1], |
---|
113 | strerror(errno)); |
---|
114 | exit(1); |
---|
115 | } |
---|
116 | } else { |
---|
117 | fprintf(stderr, "Usage: %s ?fileName?\n", argv[0]); |
---|
118 | } |
---|
119 | |
---|
120 | /* |
---|
121 | * Make two passes over the file. In the first pass, just check to make |
---|
122 | * sure we can handle everything. If there are problems, generate output |
---|
123 | * and stop. If everything is OK, make a second pass to actually generate |
---|
124 | * output. |
---|
125 | */ |
---|
126 | |
---|
127 | for (writeOutput = 0; writeOutput < 2; writeOutput++) { |
---|
128 | lineNumber = 0; |
---|
129 | status = 0; |
---|
130 | while (fgets(line, MAX_LINE_SIZE, f) != NULL) { |
---|
131 | for (p = line; *p != 0; p++) { |
---|
132 | if (*p == '\n') { |
---|
133 | *p = 0; |
---|
134 | break; |
---|
135 | } |
---|
136 | } |
---|
137 | lineNumber++; |
---|
138 | |
---|
139 | if (((line[0] == '.') || (line[0] == '\'')) && (line[1] == '\\') && (line[2] == '\"')) { |
---|
140 | /* |
---|
141 | * This line is a comment. Ignore it. |
---|
142 | */ |
---|
143 | |
---|
144 | continue; |
---|
145 | } |
---|
146 | |
---|
147 | if (strlen(line) >= MAX_LINE_SIZE -1) { |
---|
148 | fprintf(stderr, "Too long line. Max is %d chars.\n", |
---|
149 | MAX_LINE_SIZE - 1); |
---|
150 | exit(1); |
---|
151 | } |
---|
152 | |
---|
153 | if ((line[0] == '.') || (line[0] == '\'')) { |
---|
154 | /* |
---|
155 | * This line is a macro invocation. |
---|
156 | */ |
---|
157 | |
---|
158 | DoMacro(line); |
---|
159 | } else { |
---|
160 | /* |
---|
161 | * This line is text, possibly with formatting characters |
---|
162 | * embedded in it. |
---|
163 | */ |
---|
164 | |
---|
165 | DoText(line); |
---|
166 | } |
---|
167 | } |
---|
168 | if (status != 0) { |
---|
169 | break; |
---|
170 | } |
---|
171 | fseek(f, 0, SEEK_SET); |
---|
172 | } |
---|
173 | exit(status); |
---|
174 | } |
---|
175 | |
---|
176 | /* |
---|
177 | *---------------------------------------------------------------------- |
---|
178 | * |
---|
179 | * DoMacro -- |
---|
180 | * |
---|
181 | * This function is called to handle a macro invocation. It parses the |
---|
182 | * arguments to the macro and generates a Tcl command to handle the |
---|
183 | * invocation. |
---|
184 | * |
---|
185 | * Results: |
---|
186 | * None. |
---|
187 | * |
---|
188 | * Side effects: |
---|
189 | * A Tcl command is written to stdout. |
---|
190 | * |
---|
191 | *---------------------------------------------------------------------- |
---|
192 | */ |
---|
193 | |
---|
194 | static void |
---|
195 | DoMacro( |
---|
196 | char *line) /* The line of text that contains the macro |
---|
197 | * invocation. */ |
---|
198 | { |
---|
199 | char *p, *end; |
---|
200 | |
---|
201 | /* |
---|
202 | * If there is no macro name, then just skip the whole line. |
---|
203 | */ |
---|
204 | |
---|
205 | if ((line[1] == 0) || (isspace(line[1]))) { |
---|
206 | return; |
---|
207 | } |
---|
208 | |
---|
209 | PRINT(("macro")); |
---|
210 | if (*line != '.') { |
---|
211 | PRINT(("2")); |
---|
212 | } |
---|
213 | |
---|
214 | /* |
---|
215 | * Parse the arguments to the macro (including the name), in order. |
---|
216 | */ |
---|
217 | |
---|
218 | p = line+1; |
---|
219 | while (1) { |
---|
220 | PRINTC(' '); |
---|
221 | if (*p == '"') { |
---|
222 | /* |
---|
223 | * The argument is delimited by quotes. |
---|
224 | */ |
---|
225 | |
---|
226 | for (end = p+1; *end != '"'; end++) { |
---|
227 | if (*end == 0) { |
---|
228 | fprintf(stderr, |
---|
229 | "Unclosed quote in macro call on line %d.\n", |
---|
230 | lineNumber); |
---|
231 | status = 1; |
---|
232 | break; |
---|
233 | } |
---|
234 | } |
---|
235 | QuoteText(p+1, (end-(p+1))); |
---|
236 | } else { |
---|
237 | for (end = p+1; (*end != 0) && !isspace(*end); end++) { |
---|
238 | /* Empty loop body. */ |
---|
239 | } |
---|
240 | QuoteText(p, end-p); |
---|
241 | } |
---|
242 | if (*end == 0) { |
---|
243 | break; |
---|
244 | } |
---|
245 | p = end+1; |
---|
246 | while (isspace(*p)) { |
---|
247 | /* |
---|
248 | * Skip empty space before next argument. |
---|
249 | */ |
---|
250 | |
---|
251 | p++; |
---|
252 | } |
---|
253 | if (*p == 0) { |
---|
254 | break; |
---|
255 | } |
---|
256 | } |
---|
257 | PRINTC('\n'); |
---|
258 | } |
---|
259 | |
---|
260 | /* |
---|
261 | *---------------------------------------------------------------------- |
---|
262 | * |
---|
263 | * DoText -- |
---|
264 | * |
---|
265 | * This function is called to handle a line of troff text. It parses the |
---|
266 | * text, generating Tcl commands for text and for formatting stuff such |
---|
267 | * as font changes. |
---|
268 | * |
---|
269 | * Results: |
---|
270 | * None. |
---|
271 | * |
---|
272 | * Side effects: |
---|
273 | * Tcl commands are written to stdout. |
---|
274 | * |
---|
275 | *---------------------------------------------------------------------- |
---|
276 | */ |
---|
277 | |
---|
278 | static void |
---|
279 | DoText( |
---|
280 | char *line) /* The line of text. */ |
---|
281 | { |
---|
282 | char *p, *end; |
---|
283 | |
---|
284 | /* |
---|
285 | * Divide the line up into pieces consisting of backslash sequences, tabs, |
---|
286 | * and other text. |
---|
287 | */ |
---|
288 | |
---|
289 | p = line; |
---|
290 | while (*p != 0) { |
---|
291 | if (*p == '\t') { |
---|
292 | PRINT(("tab\n")); |
---|
293 | p++; |
---|
294 | } else if (*p != '\\') { |
---|
295 | /* |
---|
296 | * Ordinary text. |
---|
297 | */ |
---|
298 | |
---|
299 | for (end = p+1; (*end != '\\') && (*end != 0); end++) { |
---|
300 | /* Empty loop body. */ |
---|
301 | } |
---|
302 | PRINT(("text ")); |
---|
303 | QuoteText(p, end-p); |
---|
304 | PRINTC('\n'); |
---|
305 | p = end; |
---|
306 | } else { |
---|
307 | /* |
---|
308 | * A backslash sequence. There are particular ones that we |
---|
309 | * understand; output an error message for anything else and just |
---|
310 | * ignore the backslash. |
---|
311 | */ |
---|
312 | |
---|
313 | p++; |
---|
314 | if (*p == 'f') { |
---|
315 | /* |
---|
316 | * Font change. |
---|
317 | */ |
---|
318 | |
---|
319 | PRINT(("font %c\n", p[1])); |
---|
320 | p += 2; |
---|
321 | } else if (*p == '-') { |
---|
322 | PRINT(("dash\n")); |
---|
323 | p++; |
---|
324 | } else if (*p == 'e') { |
---|
325 | PRINT(("text \\\\\n")); |
---|
326 | p++; |
---|
327 | } else if (*p == '.') { |
---|
328 | PRINT(("text .\n")); |
---|
329 | p++; |
---|
330 | } else if (*p == '&') { |
---|
331 | p++; |
---|
332 | } else if (*p == '0') { |
---|
333 | PRINT(("text { }\n")); |
---|
334 | p++; |
---|
335 | } else if (*p == '(') { |
---|
336 | if ((p[1] == 0) || (p[2] == 0)) { |
---|
337 | fprintf(stderr, "Bad \\( sequence on line %d.\n", |
---|
338 | lineNumber); |
---|
339 | status = 1; |
---|
340 | } else { |
---|
341 | PRINT(("char {\\(%c%c}\n", p[1], p[2])); |
---|
342 | p += 3; |
---|
343 | } |
---|
344 | } else if (*p == 'N' && *(p+1) == '\'') { |
---|
345 | int ch; |
---|
346 | |
---|
347 | p += 2; |
---|
348 | sscanf(p,"%d",&ch); |
---|
349 | PRINT(("text \\u%04x", ch)); |
---|
350 | while(*p&&*p!='\'') p++; |
---|
351 | } else if (*p != 0) { |
---|
352 | PRINT(("char {\\%c}\n", *p)); |
---|
353 | p++; |
---|
354 | } |
---|
355 | } |
---|
356 | } |
---|
357 | PRINT(("newline\n")); |
---|
358 | } |
---|
359 | |
---|
360 | /* |
---|
361 | *---------------------------------------------------------------------- |
---|
362 | * |
---|
363 | * QuoteText -- |
---|
364 | * |
---|
365 | * Copy the "string" argument to stdout, adding quote characters around |
---|
366 | * any special Tcl characters so that they'll just be treated as ordinary |
---|
367 | * text. |
---|
368 | * |
---|
369 | * Results: |
---|
370 | * None. |
---|
371 | * |
---|
372 | * Side effects: |
---|
373 | * Text is written to stdout. |
---|
374 | * |
---|
375 | *---------------------------------------------------------------------- |
---|
376 | */ |
---|
377 | |
---|
378 | static void |
---|
379 | QuoteText( |
---|
380 | char *string, /* The line of text. */ |
---|
381 | int count) /* Number of characters to write from |
---|
382 | * string. */ |
---|
383 | { |
---|
384 | if (count == 0) { |
---|
385 | PRINT(("{}")); |
---|
386 | return; |
---|
387 | } |
---|
388 | for ( ; count > 0; string++, count--) { |
---|
389 | switch (*string) { |
---|
390 | case '\\': |
---|
391 | if (*(string+1) == 'N' && *(string+2) == '\'') { |
---|
392 | int ch; |
---|
393 | |
---|
394 | string += 3; |
---|
395 | count -= 3; |
---|
396 | sscanf(string,"%d",&ch); |
---|
397 | PRINT(("\\u%04x", ch)); |
---|
398 | while(count>0&&*string!='\'') {string++;count--;} |
---|
399 | continue; |
---|
400 | } else if (*(string+1) == '0') { |
---|
401 | PRINT(("\\ ")); |
---|
402 | string++; |
---|
403 | count--; |
---|
404 | continue; |
---|
405 | } |
---|
406 | case '$': case '[': case '{': case ' ': case ';': |
---|
407 | case '"': case '\t': |
---|
408 | PRINTC('\\'); |
---|
409 | default: |
---|
410 | PRINTC(*string); |
---|
411 | } |
---|
412 | } |
---|
413 | } |
---|
414 | |
---|
415 | /* |
---|
416 | * Local Variables: |
---|
417 | * mode: c |
---|
418 | * c-basic-offset: 4 |
---|
419 | * fill-column: 78 |
---|
420 | * End: |
---|
421 | */ |
---|