OpenSolaris_b135/cmd/sunpc/other/dos2unix.c

Compare this file to the similar file:
Show the results in this format:

/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License, Version 1.0 only
 * (the "License").  You may not use this file except in compliance
 * with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2003 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

#pragma ident	"%Z%%M%	%I%	%E% SMI" 

/*
 *	Converts files from one char set to another
 *
 *	Written 11/09/87	Eddy Bell
 *
 */


/*
 *  INCLUDED and DEFINES
 */
#include	<stdio.h>
#include	<fcntl.h>
#include	<sys/systeminfo.h>
#include	<stdlib.h>
#include	<string.h>
#include	<errno.h>

/*#include	<io.h>			for microsoft c 4.0 */

#define 	CONTENTS_ASCII	0
#define 	CONTENTS_ASCII8 1
#define 	CONTENTS_ISO	2
#define 	CONTENTS_DOS	3
#ifdef _F_BIN
#define DOS_BUILD 1
#else
#define UNIX_BUILD 1
#endif

/******************************************************************************
 * INCLUDES AND DEFINES
 ******************************************************************************/
#ifdef UNIX_BUILD
#include <sys/types.h>
#include	<sys/kbio.h>
#include	<sys/time.h>
#include	<fcntl.h>
#include "../sys/dos_iso.h"
#endif

#ifdef DOS_BUILD
#include <dos.h>
#include "..\sys\dos_iso.h"
#endif


#define 	GLOBAL
#define 	LOCAL	static
#define 	VOID	int
#define 	BOOL	int

#define 	FALSE	0
#define 	TRUE	~FALSE

#define 	CR	0x0D
#define 	LF	0x0A
#define 	DOS_EOF 0x1A
#define		MAXLEN	1024


/******************************************************************************
 * FUNCTION AND VARIABLE DECLARATIONS
 ******************************************************************************/
static	void	error();
static	void	usage();
static int	tmpfd = -1;

/******************************************************************************
* ENTRY POINTS
 ******************************************************************************/

int
main(int argc, char **argv)
{
   FILE *in_stream = NULL;
   FILE *out_stream = NULL;
	unsigned char tmp_buff[512];
	unsigned char *src_str, *dest_str;
	char	 *in_file_name, *out_file_name;
   int num_read, i, j, out_len, translate_mode, same_name;			       /* char count for fread() */
   unsigned char * dos_to_iso;
	int	type;
	int	code_page_overide; /* over ride of default codepage */
#ifdef UNIX_BUILD
	int	kbdfd;
#endif
	char	sysinfo_str[MAXLEN];

	same_name = FALSE;
	out_file_name = (char *)0;

    /*	The filename parameter is positionally dependent - it must be the
     *	second argument, immediately following the program name. Except
     *	when a char set switch is passed then the file name must be third
     *	argument.
     */

	argv++;
	in_stream = stdin;
	out_stream = stdout;
	j = 0;  /* count for file names 0 -> source 1-> dest */
	translate_mode = CONTENTS_ISO; /*default trans mode*/
	code_page_overide = 0;
	for (i=1; i<argc; i++) {
      		if (*argv[0] == '-') {
			if (argc > 1 && !strncmp(*argv,"-iso",4)) {
				translate_mode = CONTENTS_ISO;
				argv++;
			} else if (argc > 1 && !strncmp(*argv,"-7",2)) {
				translate_mode = CONTENTS_ASCII;
				argv++;
			} else if (argc > 1 && !strncmp(*argv,"-ascii",6)) {
				translate_mode = CONTENTS_DOS;
				argv++;
			} else if (argc > 1 && !strncmp(*argv,"-437",4)) {
				code_page_overide = CODE_PAGE_US;
				argv++;
			} else if (argc > 1 && !strncmp(*argv,"-850",4)) {
				code_page_overide = CODE_PAGE_MULTILINGUAL;
				argv++;
			} else if (argc > 1 && !strncmp(*argv,"-860",4)) {
				code_page_overide = CODE_PAGE_PORTUGAL;
				argv++;
			} else if (argc > 1 && !strncmp(*argv,"-863",4)) {
				code_page_overide = CODE_PAGE_CANADA_FRENCH;
				argv++;
			} else if (argc > 1 && !strncmp(*argv,"-865",4)) {
				code_page_overide = CODE_PAGE_NORWAY;
				argv++;
			} else
				argv++;
			continue;
		}else{  /* not a command so must be filename */
			switch(j){
				case IN_FILE:	/* open in file from cmdline */
		       			in_file_name = *argv;
		       			j++;  /* next file name is outfile */
			       	break;

				case OUT_FILE:	/* open out file from cmdline */
					out_file_name = *argv;
					j++;
			   	break;

				default:
					usage();
			}
		}
		
	
	argv++;
	}

	/* input file is specified */
	if (j > 0) {
		in_stream = fopen(in_file_name, "r");
		if (in_stream == NULL)
			error("Couldn't open input file %s.", in_file_name);
	}

	/* output file is secified */
	if (j > 1) {
		if(!strcmp(in_file_name, out_file_name)){
			/* input and output have same name */
			if (access(out_file_name, 2))
				error("%s not writable.", out_file_name);
			strcpy(out_file_name, "/tmp/udXXXXXX");
			tmpfd = mkstemp(out_file_name);
			if (tmpfd == -1) {
				error("Couldn't create output file %s.",
				    out_file_name);
			}
			(void) close(tmpfd);
			same_name = TRUE;
		} else
			same_name = FALSE;
		out_stream = fopen(out_file_name, "w");
		if (out_stream == NULL) {
			(void) unlink(out_file_name);
			error("Couldn't open output file %s.", out_file_name);
		}
	}

#ifdef _F_BIN
	setmode(fileno(in_stream), O_BINARY);
	setmode(fileno(out_stream), O_BINARY);
#endif

#ifdef UNIX_BUILD
	if(!code_page_overide){
		if (sysinfo(SI_ARCHITECTURE,sysinfo_str,MAXLEN)  < 0) {
			fprintf(stderr,"could not obtain system information\n");
			(void) unlink(out_file_name);
			exit(1);
		
		}
		if (strcmp(sysinfo_str,"i386")) {
			if ((kbdfd = open("/dev/kbd", O_WRONLY)) < 0) {
				fprintf(stderr, "could not open /dev/kbd to "
				    "get keyboard type US keyboard assumed\n");
			}
			if (ioctl(kbdfd, KIOCLAYOUT, &type) < 0) {
				fprintf(stderr,"could not get keyboard type US keyboard assumed\n");
			}
		} else {
			type = 0;
		}
		switch(type){
			case	0:
			case	1:	/* United States */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	2:	/* Belgian French */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	3:	/* Canadian French */
				dos_to_iso = &dos_to_iso_cp_863[0];
			break;
	
			case	4:	/* Danish */
				dos_to_iso = &dos_to_iso_cp_865[0];
			break;
	
			case	5:	/* German */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	6:	/* Italian */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	7:	/* Netherlands Dutch */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	8:	/* Norwegian */
				dos_to_iso = &dos_to_iso_cp_865[0];
			break;
	
			case	9:	/* Portuguese */
				dos_to_iso = &dos_to_iso_cp_860[0];
			break;
	
			case	10:	/* Spanish */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	11:	/* Swedish Finnish */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	12:	/* Swiss French */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	13:	/* Swiss German */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	14:	/* United Kingdom */
				dos_to_iso = &dos_to_iso_cp_437[0];
	
			break;
			
			default:
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
		}
	}else{
		switch(code_page_overide){
			case CODE_PAGE_US:
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
			
			case CODE_PAGE_MULTILINGUAL:
				dos_to_iso = &dos_to_iso_cp_850[0];
			break;
			
			case CODE_PAGE_PORTUGAL:
				dos_to_iso = &dos_to_iso_cp_860[0];
			break;
			
			case CODE_PAGE_CANADA_FRENCH:
				dos_to_iso = &dos_to_iso_cp_863[0];
			break;
			
			case CODE_PAGE_NORWAY:
				dos_to_iso = &dos_to_iso_cp_865[0];
			break;
		}
	}	
	
#endif
#ifdef DOS_BUILD
	if(!code_page_overide){
		{
		union REGS regs;
		regs.h.ah = 0x66;	/* get/set global code page */
		regs.h.al = 0x01;		/* get */
		intdos(&regs, &regs);
		type = regs.x.bx;
		}
		switch(type){
			case	437:	/* United States */
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
	
			case	850:	/* Multilingual */
				dos_to_iso = &dos_to_iso_cp_850[0];
			break;
			
			case	860:	/* Portuguese */
				dos_to_iso = &dos_to_iso_cp_860[0];
			break;
			
			case	863:	/* Canadian French */
				dos_to_iso = &dos_to_iso_cp_863[0];
			break;
	
			case	865:	/* Danish */
				dos_to_iso = &dos_to_iso_cp_865[0];
			break;
	
			default:
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
		}
	}else{
		switch(code_page_overide){
			case CODE_PAGE_US:
				dos_to_iso = &dos_to_iso_cp_437[0];
			break;
			
			case CODE_PAGE_MULTILINGUAL:
				dos_to_iso = &dos_to_iso_cp_850[0];
			break;
			
			case CODE_PAGE_PORTUGAL:
				dos_to_iso = &dos_to_iso_cp_860[0];
			break;
			
			case CODE_PAGE_CANADA_FRENCH:
				dos_to_iso = &dos_to_iso_cp_863[0];
			break;
			
			case CODE_PAGE_NORWAY:
				dos_to_iso = &dos_to_iso_cp_865[0];
			break;
		}
	}	
	
	
#endif

    /*	While not EOF, read in chars and send them to out_stream
     *	if current char is not a CR.
     */

    do {
		num_read = fread(&tmp_buff[0], 1, 100, in_stream);
		i = 0;
		out_len = 0;
		src_str = dest_str = &tmp_buff[0];
		switch (translate_mode){
			case CONTENTS_ISO:
				{
				while ( i++ != num_read ){
					if( *src_str == '\r'){
						src_str++;
						}
					else{
						out_len++;
						*dest_str++ = dos_to_iso[*src_str++];
						}
					}
				}
				break;

			case CONTENTS_ASCII:
				{
				while ( i++ != num_read){
					if( *src_str == '\r'){
						src_str++;
						continue;
						}
					else if ( *src_str > 127 ){
						*dest_str++ = (unsigned char) ' ';
						src_str++;
						out_len++;
						}
					else{
						out_len++;
						*dest_str++ = *src_str++;
						}
					}
				}
				break;

			case CONTENTS_DOS:
				{
				while ( i++ != num_read){
					if( *src_str == '\r'){
						src_str++;
						continue;
						}
						*dest_str++ =	*src_str++;
						out_len++;
					}
				}
				break;
			}
		if (out_len > num_read)
			out_len = num_read;
		if (tmp_buff[out_len-2] == DOS_EOF)
			out_len -= 2;
		else if (tmp_buff[out_len-1] == DOS_EOF)
			out_len -= 1;

		if( out_len > 0 &&
		    out_len != (i= fwrite(&tmp_buff[0], 1, out_len, out_stream)))
			error("Error writing %s.", out_file_name);

		} while (!feof(in_stream));

	fclose(out_stream);
	fclose(in_stream);
	if(same_name){
		unlink(in_file_name);
		in_stream = fopen(out_file_name, "r");
		out_stream = fopen(in_file_name, "w");
#ifdef _F_BIN
		setmode(fileno(in_stream), O_BINARY);
		setmode(fileno(out_stream), O_BINARY);
#endif
		while ((num_read = (unsigned)fread(tmp_buff, 1, sizeof tmp_buff, in_stream)) != 0) {
		   if( num_read != fwrite(tmp_buff, 1, num_read, out_stream))
			error("Error writing %s.", in_file_name);
		}
		fclose(out_stream);
		fclose(in_stream);
		unlink(out_file_name);
	}
	return (0);
}

void	error(format, args)
	char	*format;
	char	*args;
{
	fprintf(stderr, "dos2unix: ");
	fprintf(stderr, format, args);
	fprintf(stderr, "  %s.\n", strerror(errno));
	exit(1);
}

void usage()
{
	fprintf(stderr, "usage: dos2unix [ -ascii ] [ -iso ] [ -7 ] [ originalfile [ convertedfile ] ]\n");
	exit(1);
}