/* Blob Blame History Raw -- web-viewer navigation residue, not part of argv.h */
/****************************************************************************/
/*  argv.h: a thread-safe argument vector parser and usage screen generator */
/*  Copyright (C) 2015  Z. Gilboa                                           */
/*  Released under the Standard MIT License; see COPYING.SOFORT.            */
/*  This file is (also) part of sofort: portable software project template. */
/****************************************************************************/

#ifndef ARGV_H
#define ARGV_H

#include <stdbool.h>
#include <stdint.h>
#include <stddef.h>
#include <errno.h>
#include <string.h>
#include <stdlib.h>
#include <stdio.h>

/* bit flags for the flags argument of argv_get() (kept in argv_ctx.flags) */

/* no bits set; not tested by any code visible in this header */
#define ARGV_VERBOSITY_NONE		0x00
/* argv_get() reports a failed scan on stderr via argv_show_error() */
#define ARGV_VERBOSITY_ERRORS		0x01
/* argv_get() dumps the parsed command line on stderr via argv_show_status() */
#define ARGV_VERBOSITY_STATUS		0x02
/* argv_alloc() makes a private copy of the vector and of its strings */
#define ARGV_CLONE_VECTOR		0x80

/* whether an option takes a value (see argv_option.optarg) */
enum argv_optarg {
	/* the option never takes a value */
	ARGV_OPTARG_NONE,
	/* a value must follow; argv_scan() otherwise fails with ARGV_ERROR_OPTARG_REQUIRED */
	ARGV_OPTARG_REQUIRED,
	/* a value may follow; a following option-like argument is not taken as the value */
	ARGV_OPTARG_OPTIONAL,
};

/* pass selector for argv_scan() (see argv_ctx.mode) */
enum argv_mode {
	/* validate the vector and count its entries in argv_ctx.nentries */
	ARGV_MODE_SCAN,
	/* fill the argv_meta.entries array */
	ARGV_MODE_COPY,
};

/* outcome of a scan (see argv_ctx.errcode); reported by argv_show_error() */
enum argv_error {
	/* no error */
	ARGV_ERROR_OK,
	/* set by argv_get() when the copy pass fails after a successful scan pass */
	ARGV_ERROR_INTERNAL,
	/* a short option character is not in the option table */
	ARGV_ERROR_SHORT_OPTION,
	/* a long option name is not in the option table */
	ARGV_ERROR_LONG_OPTION,
	/* a value was supplied to an option that takes none */
	ARGV_ERROR_OPTARG_NONE,
	/* an option that takes a value was not given a usable one */
	ARGV_ERROR_OPTARG_REQUIRED,
	/* the value is not one of the alternatives in the option's paradigm */
	ARGV_ERROR_OPTARG_PARADIGM,
};

/* one row of the caller-supplied option table; the table ends at the first
 * row whose long_name and short_name are both zero. */
struct argv_option {
	/* name matched after "--"; may be 0 for a short-only option */
	const char *		long_name;
	/* character matched after "-"; may be 0 for a long-only option */
	const char		short_name;
	/* caller-chosen identifier, copied into argv_entry.tag on a match */
	int			tag;
	/* whether the option takes a value */
	enum argv_optarg	optarg;
	/* '|'-separated list of accepted values, or 0 to accept any value */
	const char *		paradigm;
	/* value placeholder shown by argv_usage(), or 0 */
	const char *		argname;
	/* help text; argv_usage() passes it to snprintf() as the FORMAT string,
	 * with the paradigm (or else the argname) as the single argument */
	const char *		description;
};

/* one parsed element of the command line, as produced by argv_scan() in
 * ARGV_MODE_COPY. */
struct argv_entry {
	/* the option's value, or the program argument; 0 for an option without a value */
	const char *	arg;
	/* tag of the matching argv_option (option entries only) */
	int		tag;
	/* true when the entry is an option rather than a program argument */
	bool		fopt;
	/* true when the option entry carries a value in arg */
	bool		fval;
	/* true when the argument appeared after the "--" delimiter */
	bool		fnoscan;
	/* not written by any code visible in this header */
	enum argv_error errcode;
};

/* result of argv_get(); release with argv_free(). */
struct argv_meta {
	/* the scanned vector: the caller's own, or a clone under ARGV_CLONE_VECTOR */
	const char **		argv;
	/* parsed entries; the array is allocated zero-filled with one spare
	 * element, so it ends with an entry whose arg and fopt are both zero */
	struct argv_entry *	entries;
};

/* private allocation record wrapped around a struct argv_meta; argv_free()
 * recovers it from the address of the embedded meta member. */
struct argv_meta_impl {
	/* cloned vector (allocated only under ARGV_CLONE_VECTOR, otherwise 0) */
	const char **		argv;
	/* storage for the cloned argument strings (otherwise 0) */
	char *			strbuf;
	/* the part handed out to the caller */
	struct argv_meta	meta;
};

/* working state shared between argv_get(), argv_scan() and the reporters. */
struct argv_ctx {
	/* the flags argument of argv_get() (ARGV_VERBOSITY_*, ARGV_CLONE_VECTOR) */
	int				flags;
	/* ARGV_MODE_SCAN or ARGV_MODE_COPY */
	int				mode;
	/* number of entries counted by the scan pass */
	int				nentries;
	/* ARGV_ERROR_OK, or the reason the scan stopped */
	enum argv_error 		errcode;
	/* position in the command line text at which the error was detected */
	const char *			errch;
	/* option involved in the error, or 0 when no option was matched */
	const struct argv_option *	erropt;
	/* program name used as the prefix of error messages */
	const char *			program;
};

#ifdef ARGV_DRIVER

/* return the part of a path that follows its last '/' (or, failing that, its
 * last '\\'); 0 when the path ends with that separator. */
static const char * argv_program_name(const char *);

/* write a formatted option listing to the given stream; mode is "short",
 * "long", or anything else (including 0) for the combined "-x,--name" form. */
static void argv_usage(
	FILE *,
	const char *	header,
	const struct	argv_option[],
	const char *	mode);

/* parse a null-terminated argument vector against an option table; returns
 * the parsed entries, or 0 on a parse error or allocation failure. */
static struct argv_meta * argv_get(
	const char **,
	const struct argv_option[],
	int flags);

/* release a result of argv_get(); a null pointer is ignored. */
static void argv_free(struct argv_meta *);




/*------------------------------------*/
/* implementation of static functions */
/*------------------------------------*/

/* find the table row whose short name equals the character at ch; on a match
 * store the row's tag in entry, flag entry as an option, and return the row.
 * returns 0 when no row matches. */
static const struct argv_option * argv_short_option(
	const char *			ch,
	const struct argv_option	options[],
	struct argv_entry *		entry)
{
	const struct argv_option *	row = options;

	/* the table ends at the first row with neither name set */
	while (row->long_name || row->short_name) {
		if (row->short_name == *ch) {
			entry->fopt	= true;
			entry->tag	= row->tag;
			return row;
		}

		row++;
	}

	return 0;
}

/* find the table row whose long name is spelled out at ch and is followed
 * there by either the end of the string or '='; on a match store the row's
 * tag in entry, flag entry as an option, and return the row.
 * returns 0 when no row matches. */
static const struct argv_option * argv_long_option(
	const char *			ch,
	const struct argv_option	options[],
	struct argv_entry *		entry)
{
	const struct argv_option *	row;
	size_t				namelen;
	char				tail;

	for (row=options; row->long_name || row->short_name; row++) {
		/* rows without a (non-empty) long name cannot match */
		if (!row->long_name)
			continue;

		if (!(namelen = strlen(row->long_name)))
			continue;

		if (strncmp(row->long_name,ch,namelen) != 0)
			continue;

		/* reject mere prefixes, e.g. "--foobar" against "foo" */
		tail = ch[namelen];

		if ((tail == '\0') || (tail == '=')) {
			entry->fopt	= true;
			entry->tag	= row->tag;
			return row;
		}
	}

	return 0;
}

/* true for "-x..." : a dash followed by at least one character that is not
 * itself a dash ("-" alone and "--..." do not qualify). */
static inline bool is_short_option(const char * arg)
{
	if (arg[0] != '-')
		return false;

	if ((arg[1] == '\0') || (arg[1] == '-'))
		return false;

	return true;
}

/* true for "--x..." : two dashes followed by at least one more character. */
static inline bool is_long_option(const char * arg)
{
	if (strncmp(arg,"--",2) != 0)
		return false;

	return arg[2] != '\0';
}

/* true only for the bare "--" delimiter. */
static inline bool is_last_option(const char * arg)
{
	return strcmp(arg,"--") == 0;
}

/* test whether arg is exactly one of the '|'-separated alternatives listed
 * in paradigm (e.g. "never" in "always|never|auto").
 *
 * arg:      the candidate value; must not be null.
 * paradigm: the list of alternatives; a null list accepts nothing.
 *
 * each alternative is compared as a whole, by length and content, so that
 * a value which itself contains '|' (such as "always|never") can never be
 * accepted by spanning two adjacent alternatives. */
static inline bool is_arg_in_paradigm(const char * arg, const char * paradigm)
{
	size_t		arglen;
	const char *	alt;
	const char *	end;

	if (!paradigm)
		return false;

	arglen = strlen(arg);

	for (alt=paradigm; ; alt=end+1) {
		/* [alt,end) is the current alternative */
		if (!(end = strchr(alt,'|')))
			end = alt + strlen(alt);

		if (((size_t)(end - alt) == arglen) && !memcmp(alt,arg,arglen))
			return true;

		/* the last alternative ends at the terminating null */
		if (!*end)
			return false;
	}
}

/* return the first table row carrying the given tag, or 0 when no row does. */
static inline const struct argv_option * option_from_tag(
	const struct argv_option	options[],
	int				tag)
{
	const struct argv_option *	row = options;

	/* the table ends at the first row with neither name set */
	while (row->short_name || row->long_name) {
		if (row->tag == tag)
			return row;

		row++;
	}

	return 0;
}

/* walk the argument vector (argv[0] is skipped) and classify every element
 * as an option, an option value, or a program argument.
 *
 * argv:    null-terminated argument vector.
 * options: option table, ended by a row with neither name set.
 * ctx:     ctx->mode selects the pass:
 *          ARGV_MODE_SCAN  validates the vector and counts the entries
 *                          in ctx->nentries;
 *          ARGV_MODE_COPY  stores the entries in meta->entries.
 *          on failure ctx->errcode, ctx->errch and ctx->erropt describe
 *          the error and the walk stops.
 * meta:    destination of the copy pass; may be 0 in the scan pass.
 *
 * short options may be clustered ("-abc") and may carry an attached value
 * ("-ovalue"); long options take their value either attached ("--opt=value")
 * or as the next argument. everything after a bare "--" is a program
 * argument; the "--" delimiter itself never becomes an entry. */
static void argv_scan(
	const char **			argv,
	const struct argv_option	options[],
	struct argv_ctx *		ctx,
	struct argv_meta *		meta)
{
	const char **			parg;
	const char *			ch;
	const char *			val;
	const struct argv_option *	option;
	struct argv_entry		entry;
	struct argv_entry *		mentry;
	enum argv_error			ferror;
	bool				fval;
	bool				fnext;
	bool				fshort;
	bool				fnoscan;

	/* an empty vector has no argv[0] to skip and nothing to scan */
	if (!*argv)
		return;

	argv++;
	parg	= argv;
	ch	= *parg;
	ferror	= ARGV_ERROR_OK;
	fshort	= false;
	fnoscan	= false;
	fval	= false;
	fnext	= false;
	mentry	= meta ? meta->entries : 0;

	while (ch && (ferror == ARGV_ERROR_OK)) {
		option = 0;

		if (fnoscan)
			/* past "--": everything is a program argument */
			fval = true;

		else if (is_last_option(ch)) {
			fnoscan = true;

			/* fval may still be set from a preceding option that */
			/* took a value; clear it so that the delimiter itself */
			/* is neither counted nor stored as a program argument */
			fval = false;

		} else if ((fshort || is_short_option(ch))) {
			/* fshort: ch already points into a cluster of short */
			/* options; otherwise step over the leading dash */
			if (!fshort)
				ch++;

			if ((option = argv_short_option(ch,options,&entry))) {
				if (ch[1]) {
					/* more characters follow in this argument: */
					/* either further short options or a value */
					ch++;
					fnext	= false;
					fshort	= (option->optarg == ARGV_OPTARG_NONE);
				} else {
					/* end of this argument: look at the next one */
					parg++;
					ch	= *parg;
					fnext	= true;
					fshort	= false;
				}

				if (option->optarg == ARGV_OPTARG_NONE) {
					if (!fnext && ch && (*ch == '-'))
						ferror = ARGV_ERROR_OPTARG_NONE;
					else
						fval = false;
				} else if (!fnext)
					/* attached value, as in "-ovalue" */
					fval = true;
				else if (option->optarg == ARGV_OPTARG_REQUIRED) {
					if (ch && is_short_option(ch))
						ferror = ARGV_ERROR_OPTARG_REQUIRED;
					else if (ch && is_long_option(ch))
						ferror = ARGV_ERROR_OPTARG_REQUIRED;
					else if (ch && is_last_option(ch))
						ferror = ARGV_ERROR_OPTARG_REQUIRED;
					else if (ch)
						fval = true;
					else
						ferror = ARGV_ERROR_OPTARG_REQUIRED;
				} else {
					/* ARGV_OPTARG_OPTIONAL */
					if (ch && is_short_option(ch))
						fval = false;
					else if (ch && is_long_option(ch))
						fval = false;
					else if (ch && is_last_option(ch))
						fval = false;
					else
						fval = ch;
				}
			} else
				ferror = ARGV_ERROR_SHORT_OPTION;

		} else if ((is_long_option(ch))) {
			if ((option = argv_long_option(ch+=2,options,&entry))) {
				val = ch + strlen(option->long_name);

				/* val[0] is either '=' or '\0' */
				if (!val[0]) {
					parg++;
					ch = *parg;
				}

				if (option->optarg == ARGV_OPTARG_NONE) {
					if (val[0]) {
						ferror = ARGV_ERROR_OPTARG_NONE;
						ctx->errch = val + 1;
					} else
						fval = false;
				} else if (val[0] && !val[1])
					/* "--opt=" with nothing after the '=' */
					ferror = ARGV_ERROR_OPTARG_REQUIRED;
				else if (val[0] && val[1]) {
					/* attached value, as in "--opt=value" */
					fval = true;
					ch   = ++val;
				} else if (option->optarg == ARGV_OPTARG_REQUIRED) {
					if (!val[0] && !*parg)
						ferror = ARGV_ERROR_OPTARG_REQUIRED;
					else if (*parg && is_short_option(*parg))
						ferror = ARGV_ERROR_OPTARG_REQUIRED;
					else if (*parg && is_long_option(*parg))
						ferror = ARGV_ERROR_OPTARG_REQUIRED;
					else if (*parg && is_last_option(*parg))
						ferror = ARGV_ERROR_OPTARG_REQUIRED;
					else
						fval = true;
				} else {
					/* ARGV_OPTARG_OPTIONAL */
					if (!val[0] && !*parg)
						fval = false;
					else if (*parg && is_short_option(*parg))
						fval = false;
					else if (*parg && is_long_option(*parg))
						fval = false;
					else if (*parg && is_last_option(*parg))
						fval = false;
					else
						fval = *parg;
				}
			} else
				ferror = ARGV_ERROR_LONG_OPTION;
		}

		/* a value must be one of the option's listed alternatives */
		if (ferror == ARGV_ERROR_OK)
			if (option && fval && option->paradigm)
				if (!is_arg_in_paradigm(ch,option->paradigm))
					ferror = ARGV_ERROR_OPTARG_PARADIGM;

		if (ferror != ARGV_ERROR_OK) {
			ctx->errcode = ferror;
			ctx->errch   = ctx->errch ? ctx->errch : ch;
			ctx->erropt  = option;
			return;
		} else if (ctx->mode == ARGV_MODE_SCAN) {
			if (!fnoscan)
				ctx->nentries++;
			else if (fval)
				ctx->nentries++;

			/* an option without a value has already advanced */
			if (fval || !option) {
				parg++;
				ch = *parg;
			}
		} else if (ctx->mode == ARGV_MODE_COPY) {
			if (fnoscan) {
				if (fval) {
					mentry->arg	= ch;
					mentry->fnoscan = true;
					mentry++;
				}

				parg++;
				ch = *parg;
			} else if (option) {
				mentry->arg	= fval ? ch : 0;
				mentry->tag	= option->tag;
				mentry->fopt	= true;
				mentry->fval	= fval;
				mentry++;

				if (fval) {
					parg++;
					ch = *parg;
				}
			} else {
				mentry->arg = ch;
				mentry++;
				parg++;
				ch = *parg;
			}
		}
	}
}

/* return the part of program_path that follows its last '/'; a path with no
 * '/' is split at its last '\\' instead, and a path with neither separator
 * is returned as is. returns 0 for a null path, and also when nothing
 * follows the separator that was found. */
static const char * argv_program_name(const char * program_path)
{
	const char * sep;

	if (!program_path)
		return 0;

	/* a forward slash, when present, takes precedence over a backslash */
	sep = strrchr(program_path,'/');

	if (!sep)
		sep = strrchr(program_path,'\\');

	if (!sep)
		return program_path;

	return sep[1] ? sep + 1 : 0;
}

static void argv_show_error(struct argv_ctx * ctx)
{
	fprintf(stderr,"%s: error: ",ctx->program);

	switch (ctx->errcode) {
		case ARGV_ERROR_SHORT_OPTION:
			fprintf(stderr,"'%c' is not a valid short option\n",*ctx->errch);
			break;

		case ARGV_ERROR_LONG_OPTION:
			fprintf(stderr,"'--%s' is not a valid long option\n",ctx->errch);
			break;

		case ARGV_ERROR_OPTARG_NONE:
			fprintf(stderr,"'%s' is not a valid option value for [%s%c%s%s%s] (option values may not be specified)\n",
				ctx->errch,
				ctx->erropt->short_name ? "-" : "",
				ctx->erropt->short_name,
				ctx->erropt->short_name ? "," : "",
				ctx->erropt->long_name ? "--" : "",
				ctx->erropt->long_name);
			break;

		case ARGV_ERROR_OPTARG_REQUIRED:
			fprintf(stderr,"option [%s%c%s%s%s] requires %s %s%s%s\n",
				ctx->erropt->short_name ? "-" : "",
				ctx->erropt->short_name,
				ctx->erropt->short_name ? "," : "",
				ctx->erropt->long_name ? "--" : "",
				ctx->erropt->long_name,
				ctx->erropt->paradigm ? "one of the following values:" : "a value",
				ctx->erropt->paradigm ? "{" : "",
				ctx->erropt->paradigm ? ctx->erropt->paradigm : "",
				ctx->erropt->paradigm ? "}" : "");
			break;

		case ARGV_ERROR_OPTARG_PARADIGM:
			fprintf(stderr,"'%s' is not a valid option value for [%s%c%s%s%s]={%s}\n",
				ctx->errch,
				ctx->erropt->short_name ? "-" : "",
				ctx->erropt->short_name,
				ctx->erropt->short_name ? "," : "",
				ctx->erropt->long_name ? "--" : "",
				ctx->erropt->long_name,
				ctx->erropt->paradigm);
			break;

		case ARGV_ERROR_INTERNAL:
			fputs("internal error",stderr);
			break;

		default:
			break;
	}
}

/* dump the outcome of a successful parse on stderr: the command line joined
 * by single spaces, the argument vector one element per line, and the list
 * of parsed entries.
 *
 * options: option table, used to map entry tags back to option names.
 * ctx:     not used.
 * meta:    the parsed result to display.
 *
 * a missing long name is shown as an empty string rather than being passed
 * to fprintf() as a null pointer, and an entry whose tag is not found in the
 * table is shown with empty names. */
static void argv_show_status(
	const struct argv_option	options[],
	struct argv_ctx *		ctx,
	struct argv_meta *		meta)
{
	int				argc;
	const char **			argv;
	struct argv_entry *		entry;
	const struct argv_option *	option;
	char				short_name[2] = {0};
	const char *			long_name;
	const char *			space = "";

	(void)ctx;

	fputs("\n\nconcatenated command line:\n",stderr);
	for (argv=meta->argv; *argv; argv++) {
		fprintf(stderr,"%s%s",space,*argv);
		space = " ";
	}

	fputs("\n\nargument vector:\n",stderr);
	for (argc=0,argv=meta->argv; *argv; argc++,argv++)
		fprintf(stderr,"argv[%d]: %s\n",argc,*argv);

	fputs("\n\nparsed entries:\n",stderr);
	/* the entries array ends with a zero-filled element */
	for (entry=meta->entries; entry->arg || entry->fopt; entry++) {
		if (!entry->fopt) {
			fprintf(stderr,"<program arg> := %s\n",entry->arg);
			continue;
		}

		option        = option_from_tag(options,entry->tag);
		short_name[0] = option ? option->short_name : 0;
		long_name     = (option && option->long_name) ? option->long_name : "";

		if (entry->fval)
			fprintf(stderr,"[-%s,--%s] := %s\n",
				short_name,long_name,entry->arg);
		else
			fprintf(stderr,"[-%s,--%s]\n",
				short_name,long_name);
	}

	fputs("\n\n",stderr);
}

/* release an allocation record together with everything it owns: the cloned
 * vector, the cloned strings and the entries array (any of which may be 0).
 * always returns 0, so that callers can write "return argv_free_impl(...)"
 * on their failure paths. */
static struct argv_meta * argv_free_impl(struct argv_meta_impl * imeta)
{
	/* free() accepts a null pointer, so no member needs a guard */
	free(imeta->argv);
	free(imeta->strbuf);
	free(imeta->meta.entries);
	free(imeta);

	return 0;
}

/* allocate the result record for a vector that has already been scanned.
 *
 * argv: the null-terminated vector that was scanned.
 * ctx:  ctx->nentries gives the number of entries to reserve (one spare,
 *       zero-filled entry is added as the end marker); ctx->flags decides
 *       whether the vector is cloned.
 *
 * with ARGV_CLONE_VECTOR the pointer array and all strings are copied into
 * storage owned by the record, and meta.argv refers to the copy; otherwise
 * meta.argv refers to the caller's vector.
 *
 * returns the embedded struct argv_meta, or 0 when an allocation fails (in
 * which case everything allocated so far is released). */
static struct argv_meta * argv_alloc(const char ** argv, struct argv_ctx * ctx)
{
	struct argv_meta_impl * imeta;
	const char **		parg;
	char *			mark;
	size_t			nbytes;
	size_t			len;
	int			nargs;
	int			idx;

	imeta = calloc(1,sizeof(*imeta));

	if (!imeta)
		return 0;

	if (!(ctx->flags & ARGV_CLONE_VECTOR)) {
		imeta->meta.argv = argv;
	} else {
		/* measure: number of strings, and bytes including terminators */
		nargs  = 0;
		nbytes = 0;

		for (parg=argv; *parg; parg++) {
			nbytes += strlen(*parg) + 1;
			nargs++;
		}

		imeta->argv = calloc(nargs+1,sizeof(char *));

		if (!imeta->argv)
			return argv_free_impl(imeta);

		imeta->strbuf = calloc(nbytes+1,1);

		if (!imeta->strbuf)
			return argv_free_impl(imeta);

		/* pack the strings back to back into the string buffer */
		mark = imeta->strbuf;

		for (idx=0; idx<nargs; idx++) {
			len = strlen(argv[idx]) + 1;
			memcpy(mark,argv[idx],len);
			imeta->argv[idx] = mark;
			mark += len;
		}

		imeta->meta.argv = imeta->argv;
	}

	imeta->meta.entries = calloc(ctx->nentries+1,sizeof(struct argv_entry));

	if (!imeta->meta.entries)
		return argv_free_impl(imeta);

	return &imeta->meta;
}

/* parse an argument vector against an option table.
 *
 * argv:    null-terminated argument vector; argv[0] is the program path.
 * options: option table, ended by a row with neither name set.
 * flags:   bitwise OR of ARGV_VERBOSITY_ERRORS, ARGV_VERBOSITY_STATUS and
 *          ARGV_CLONE_VECTOR.
 *
 * the vector is walked twice: a first pass validates it and counts the
 * entries, a second pass fills the allocated entries array.
 *
 * returns the parsed result (to be released with argv_free()), or 0 on a
 * parse error or allocation failure. parse errors are reported on stderr
 * only when ARGV_VERBOSITY_ERRORS is set; a failure of the second pass is
 * always reported, as an internal error.
 *
 * both error paths use the same program name: the base name of argv[0], or
 * argv[0] itself when it has no base name (e.g. it ends with a separator),
 * so that the message prefix is consistent and never a null string. */
static struct argv_meta * argv_get(
	const char *			argv[],
	const struct argv_option	options[],
	int				flags)
{
	struct argv_meta *	meta;
	struct argv_ctx		ctx = {flags,ARGV_MODE_SCAN,0,ARGV_ERROR_OK,0,0,0};

	if (!(ctx.program = argv_program_name(argv[0])))
		ctx.program = argv[0] ? argv[0] : "";

	/* first pass: validate and count */
	argv_scan(argv,options,&ctx,0);

	if (ctx.errcode != ARGV_ERROR_OK) {
		if (ctx.flags & ARGV_VERBOSITY_ERRORS)
			argv_show_error(&ctx);

		return 0;
	}

	if (!(meta = argv_alloc(argv,&ctx)))
		return 0;

	/* second pass: fill the entries (over the clone, if one was made) */
	ctx.mode = ARGV_MODE_COPY;
	argv_scan(meta->argv,options,&ctx,meta);

	if (ctx.errcode != ARGV_ERROR_OK) {
		/* the same vector passed the first pass, so this is a defect */
		ctx.errcode = ARGV_ERROR_INTERNAL;
		argv_show_error(&ctx);
		argv_free(meta);

		return 0;
	}

	if (ctx.flags & ARGV_VERBOSITY_STATUS)
		argv_show_status(options,&ctx,meta);

	return meta;
}

/* release a result of argv_get(); a null pointer is ignored.
 * the pointer handed out to the caller is the meta member embedded in a
 * struct argv_meta_impl, so the enclosing record is found by stepping back
 * by that member's offset. */
static void argv_free(struct argv_meta * xmeta)
{
	char * base;

	if (!xmeta)
		return;

	base = (char *)xmeta - offsetof(struct argv_meta_impl,meta);
	argv_free_impl((struct argv_meta_impl *)base);
}

/* write a formatted listing of the option table to file.
 *
 * file:    destination stream for the header and the listing.
 * header:  text written verbatim before the listing; may be 0.
 * options: option table, ended by a row with neither name set.
 * mode:    "short" lists "-x" forms only, "long" lists "--name" forms only;
 *          any other value (including 0) lists "-x,--name".
 *
 * each line consists of three columns: the option name(s), the accepted
 * value (the paradigm in braces, or the argname; wrapped in brackets when
 * the value is optional), and the description. a paradigm that does not fit
 * its column is broken at '|' boundaries, and a description that does not
 * fit is broken at spaces or newlines, onto continuation lines.
 *
 * NOTE: option->description is used as a printf-style FORMAT string whose
 * single argument is the paradigm (or else the argname), so it may contain
 * at most one "%s" and must escape any literal percent sign as "%%".
 *
 * in "short" ("long") mode, options that have no short (long) name are
 * omitted from the listing. */
static void argv_usage(
	FILE *				file,
	const char *    		header,
	const struct argv_option	options[],
	const char *			mode)
{
	const struct argv_option *	option;
	bool				fshort,flong;
	size_t				len,optlen;
	size_t				paralen,rparalen,mparalen;
	size_t				desclen,rdesclen;
	int				ret;

	char *				para;
	char *				next_para;
	char *				desc;
	char *				next_desc;
	char *				paradigm;
	char *				buf;
	size_t				buflen;
	const char *			sdescription;
	const char *			sargname;
	const char *			sparam;

	const char			indent[] = "  ";
	const int			rblen  = sizeof("}") - sizeof(char);
	const int			rbblen = sizeof("{]") - sizeof(char);
	const int			brcklen= sizeof("[]") - sizeof(char);
	const int			solen  = sizeof("-") - sizeof(char);
	const int			lolen  = sizeof("--") - sizeof(char);
	const int			slolen = sizeof("-X,--") - sizeof(char);

	fshort = mode ? !strcmp(mode,"short") : 0;
	flong  = fshort ? 0 : mode && !strcmp(mode,"long");

	/* the header belongs to the same stream as the listing */
	if (header)
		fprintf(file,"%s",header);

	/* first pass: find the widths of the name and value columns; every */
	/* option that the second pass prints must be measured here */
	for (option=options,optlen=0,paralen=0; option->short_name || option->long_name; option++) {
		if (fshort)
			len = option->short_name ? sizeof(char) + solen : 0;
		else if (flong)
			len = option->long_name ? strlen(option->long_name) + lolen : 0;
		else if (option->long_name)
			len = strlen(option->long_name) + slolen;
		else
			len = sizeof(char) + solen;

		if (len) {
			if (len > optlen)
				optlen = len;

			if (option->paradigm)
				len = strlen(option->paradigm) + strlen("{}");
			else if (option->argname)
				len = strlen(option->argname);
			else if (option->optarg != ARGV_OPTARG_NONE)
				len = strlen("<val>");

			if (option->optarg == ARGV_OPTARG_OPTIONAL)
				len += strlen("[]");

			if (len > paralen)
				paralen = len;
		}
	}

	/* round the column widths up to the next multiple of eight */
	optlen += 8;
	optlen &= (~7);

	if (paralen) {
		paralen += (8);
		paralen &= (~7);

		/* wide value columns are capped; longer paradigms are wrapped */
		if (optlen + paralen > 64)
			paralen = 32;
	}

	/* account for '  ','\t', try to fit in 80 or 96 columns */
	if (optlen+paralen+2+8 < 80-32)
		desclen = 80 - (optlen+paralen+2+8);
	else if (optlen+paralen+2+8 < 96-32)
		desclen = 96 - (optlen+paralen+2+8);
	else
		desclen = 32;

	paradigm = next_para = buf = 0;
	rparalen = 0;
	mparalen = 0;	/* capacity of the paradigm scratch buffer */

	/* second pass: print one (possibly wrapped) line per option */
	for (option=options,buflen=0,rdesclen=1; option->short_name || option->long_name; option++) {
		/* omit options that have no name in the requested form */
		if (fshort && !option->short_name)
			continue;

		if (flong && !option->long_name)
			continue;

		/* rendered width of the paradigm, including its brackets */
		if (option->paradigm) {
			if (option->optarg == ARGV_OPTARG_OPTIONAL)
				rparalen = strlen(option->paradigm) + 2*rbblen;
			else
				rparalen = strlen(option->paradigm) + 2*rblen;
		}

		sdescription 	= option->description ? option->description : "";
		sargname	= option->argname ? option->argname : "";
		sparam		= option->paradigm ? option->paradigm : sargname;

		/* measure (and, if the buffer suffices, render) the description */
		ret      = snprintf(buf,buflen,sdescription,sparam);
		rdesclen = (ret > 0) ? (size_t)ret : 0;

		if ((ret < 0) && buflen)
			buf[0] = '\0';

		if (fshort)
			fprintf(file,"%s-%-*c",indent,(int)(optlen-solen),option->short_name);
		else if (flong)
			fprintf(file,"%s--%-*s",indent,(int)(optlen-lolen),option->long_name);
		else {
			if (option->short_name && option->long_name)
				fprintf(file,"%s-%c,--%-*s",indent,option->short_name,(int)(optlen-slolen),option->long_name);
			else if (option->short_name)
				 fprintf(file,"%s-%-*c",indent,(int)(optlen-solen),option->short_name);
			else
				fprintf(file,"%s%3s--%-*s",indent,"",(int)(optlen-slolen),option->long_name);
		}

		/* grow the buffer when the text plus its terminator does not fit */
		if (rdesclen >= buflen) {
			free(buf);

			len =  rdesclen + 512;
			len &= (~511);

			if (!(buf = calloc(len,1))) {
				buflen = 0;
				fputc('\n',file);
				continue;
			}

			buflen   = len;
			ret      = snprintf(buf,buflen,sdescription,sparam);
			rdesclen = (ret > 0) ? (size_t)ret : 0;

			if (ret < 0)
				buf[0] = '\0';
		}

		if (option->paradigm && (rparalen <= paralen)) {
			/* the paradigm fits in the value column */
			if (option->optarg == ARGV_OPTARG_OPTIONAL)
				fprintf(file,"[{%s}]%-*c",option->paradigm,(int)(paralen-strlen(option->paradigm)-2*rbblen),' ');
			else
				fprintf(file,"{%s}%-*c",option->paradigm,(int)(paralen-strlen(option->paradigm)-rbblen),' ');
			para = (char *)0;
		} else if (option->paradigm) {
			/* the paradigm must be wrapped: work on a writable copy, */
			/* held in a scratch buffer that grows to fit on demand */
			len = strlen(option->paradigm) + 1;

			if (len > mparalen) {
				free(paradigm);
				paradigm = calloc(len,1);
				mparalen = paradigm ? len : 0;
			}

			if (!paradigm) {
				fputc('\n',file);
				continue;
			}

			para = strcpy(paradigm,option->paradigm);

			if (option->optarg == ARGV_OPTARG_OPTIONAL) {
				fputs("[{",file);
				rparalen = paralen - rbblen;
			} else {
				fputc('{',file);
				rparalen = paralen - rblen;
			}
		} else if (option->argname) {
			if (option->optarg == ARGV_OPTARG_OPTIONAL)
				fprintf(file,"[%s]%-*c",option->argname,(int)(paralen-strlen(option->argname)-brcklen),' ');
			else
				fprintf(file,"%s%-*c",option->argname,(int)(paralen-strlen(option->argname)),' ');
			para = (char *)0;
		} else {
			fprintf(file,"%-*c",(int)paralen,' ');
			para = (char *)0;
		}


		if (!para && option->description && rdesclen <= desclen) {
			/* single-line description */
			fputc('\t',file);
			fputs(buf,file);
			desc = (char *)0;
		} else if (option->description)
			desc = buf;
		else
			desc = (char *)0;

		/* emit the remaining paradigm and description chunks, one */
		/* output line per iteration */
		while (para || desc) {
			if (para) {
				/* find the last '|' within the column width */
				for (next_para=para+rparalen-1; (next_para>para) && (*next_para!='|'); )
					next_para--;

				if (para > paradigm) {
					if (option->optarg == ARGV_OPTARG_OPTIONAL)
						fputs("  ",file);
					else
						fputc(' ',file);
				}

				if (*next_para != '|') {
					fprintf(file,"%s",para);
					para = (char *)0;
				} else if (next_para > para) {
					*next_para = '\0';
					fprintf(file,"%-*s",(int)rparalen,para);
					*next_para = '|';
					para = next_para;
					rparalen = strlen(para);

					/* 2*rbblen,2*rblen, etc.: account for indentation */
					if (option->optarg == ARGV_OPTARG_OPTIONAL)
						rparalen = (rparalen+2*rbblen > paralen) ? paralen-rbblen : rparalen;
					else
						rparalen = (rparalen+2*rblen > paralen) ? paralen-rblen : rparalen;
				} else {
					if (option->optarg == ARGV_OPTARG_OPTIONAL)
						fprintf(file,"%s}]%-*c",para,(int)(paralen-strlen(para)-rbblen),' ');
					else
						fprintf(file,"%s}%-*c",para,(int)(paralen-strlen(para)-rblen),' ');
					para = (char *)0;
				}
			} else if (desc > buf)
				fprintf(file,"%-*c",(int)paralen,' ');

			if (desc) {
				if (desc > buf)
					fputs("\t ",file);
				else
					fputc('\t',file);

				if ((rdesclen = strlen(desc)+(desc>buf)) <= desclen) {
					fputs(desc,file);
					desc = (char *)0;
				} else {
					/* find the last break point within the column width */
					for (next_desc=desc+desclen-1; (next_desc>desc) && (*next_desc!=' ') && (*next_desc!='\n'); )
						next_desc--;

					if ((*next_desc != ' ') && (*next_desc!='\n')) {
						fputs(desc,file);
						desc = (char *)0;
					} else if (next_desc > desc) {
						*next_desc = '\0';
						fputs(desc,file);
						desc = ++next_desc;
					} else {
						fputs(desc,file);
						desc = (char *)0;
					}
				}
			}

			if (para || desc)
				fprintf(file,"\n%s%-*c",indent,(int)optlen,' ');
		}

		fputc('\n',file);
	}

	free(paradigm);
	free(buf);
}

#endif

#endif