aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authordcw <d.white@imperial.ac.uk>2023-03-19 22:32:16 +0000
committerdcw <d.white@imperial.ac.uk>2023-03-19 22:32:16 +0000
commitb23deebc277818634fb561c424a1fad6cd7fe059 (patch)
tree3e22d294a9f93c16a2e2557566a3e3b7ec7edfe8
parenta1045c99cbfc1c89f9322b0c841b7951d9608d03 (diff)
downloadperlweeklychallenge-club-b23deebc277818634fb561c424a1fad6cd7fe059.tar.gz
perlweeklychallenge-club-b23deebc277818634fb561c424a1fad6cd7fe059.tar.bz2
perlweeklychallenge-club-b23deebc277818634fb561c424a1fad6cd7fe059.zip
imported my solutions to this week's tasks, in Perl and C
-rw-r--r--challenge-208/duncan-c-white/C/Makefile19
-rw-r--r--challenge-208/duncan-c-white/C/README11
-rw-r--r--challenge-208/duncan-c-white/C/args.c207
-rw-r--r--challenge-208/duncan-c-white/C/args.h11
-rw-r--r--challenge-208/duncan-c-white/C/ch-1.c176
-rw-r--r--challenge-208/duncan-c-white/C/ch-2.c121
-rw-r--r--challenge-208/duncan-c-white/C/csvsplit.c47
-rw-r--r--challenge-208/duncan-c-white/C/csvsplit.h14
-rw-r--r--challenge-208/duncan-c-white/C/parseints.c114
-rw-r--r--challenge-208/duncan-c-white/C/parseints.h1
-rw-r--r--challenge-208/duncan-c-white/C/printarray.c39
-rw-r--r--challenge-208/duncan-c-white/C/printarray.h1
-rw-r--r--challenge-208/duncan-c-white/README97
-rwxr-xr-xchallenge-208/duncan-c-white/perl/ch-1.pl108
-rwxr-xr-xchallenge-208/duncan-c-white/perl/ch-2.pl108
15 files changed, 1035 insertions, 39 deletions
diff --git a/challenge-208/duncan-c-white/C/Makefile b/challenge-208/duncan-c-white/C/Makefile
new file mode 100644
index 0000000000..513f8703b6
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/Makefile
@@ -0,0 +1,19 @@
+# Makefile rules generated by CB
+CC = gcc
+CFLAGS = -Wall -g
+BUILD = ch-1 ch-2
+
+all: $(BUILD)
+
+clean:
+ /bin/rm -f $(BUILD) *.o core a.out
+
+args.o: args.c
+ch-1: ch-1.o args.o csvsplit.o
+ch-1.o: ch-1.c args.h csvsplit.h
+ch-2: ch-2.o args.o parseints.o printarray.o
+ch-2.o: ch-2.c args.h parseints.h printarray.h
+csvsplit.o: csvsplit.c csvsplit.h
+parseints.o: parseints.c args.h parseints.h printarray.h
+printarray.o: printarray.c
+
diff --git a/challenge-208/duncan-c-white/C/README b/challenge-208/duncan-c-white/C/README
new file mode 100644
index 0000000000..dd5f3346f7
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/README
@@ -0,0 +1,11 @@
+Thought I'd also have a go at translating ch-1.pl and ch-2.pl into C..
+
+Both C versions produce identical (non-debugging and debugging)
+output to the Perl originals.
+
+These C versions use most of my regular support modules:
+- a command-line argument processing module args.[ch],
+- a csvlist-of-int parsing module parseints.[ch], and
+- an int-array printing module printarray.[ch].
+- plus a (new for PWC) csv splitting module csvsplit.[ch] to split
+ a single argument into a wordlist
diff --git a/challenge-208/duncan-c-white/C/args.c b/challenge-208/duncan-c-white/C/args.c
new file mode 100644
index 0000000000..d4a2d38b9a
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/args.c
@@ -0,0 +1,207 @@
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdbool.h>
+#include <string.h>
+#include <ctype.h>
+#include <assert.h>
+
+
+bool debug = false;
+
+
+// process_flag_noarg( name, argc, argv );
+// Process the -d flag, and check that there are no
+// remaining arguments.
+void process_flag_noarg( char *name, int argc, char **argv )
+{
+ int arg=1;
+ if( argc>1 && strcmp( argv[arg], "-d" ) == 0 )
+ {
+ debug = true;
+ arg++;
+ }
+
+ int left = argc-arg;
+ if( left != 0 )
+ {
+ fprintf( stderr, "Usage: %s [-d]\n", name );
+ exit(1);
+ }
+}
+
+
+// int argno = process_flag_n_args( name, argc, argv, n, argmsg );
+// Process the -d flag, and check that there are exactly
+// n remaining arguments, return the index position of the first
+// argument. If not, generate a fatal Usage error using the argmsg.
+//
+int process_flag_n_args( char *name, int argc, char **argv, int n, char *argmsg )
+{
+ int arg=1;
+ if( argc>1 && strcmp( argv[arg], "-d" ) == 0 )
+ {
+ debug = true;
+ arg++;
+ }
+
+ int left = argc-arg;
+ if( left != n )
+ {
+ fprintf( stderr, "Usage: %s [-d] %s\n Exactly %d "
+ "arguments needed\n", name, argmsg, n );
+ exit(1);
+ }
+ return arg;
+}
+
+
+// int argno = process_flag_n_m_args( name, argc, argv, min, max, argmsg );
+// Process the -d flag, and check that there are between
+// min and max remaining arguments, return the index position of the first
+// argument. If not, generate a fatal Usage error using the argmsg.
+//
+int process_flag_n_m_args( char *name, int argc, char **argv, int min, int max, char *argmsg )
+{
+ int arg=1;
+ if( argc>1 && strcmp( argv[arg], "-d" ) == 0 )
+ {
+ debug = true;
+ arg++;
+ }
+
+ int left = argc-arg;
+ if( left < min || left > max )
+ {
+ fprintf( stderr, "Usage: %s [-d] %s\n Between %d and %d "
+ "arguments needed\n", name, argmsg, min, max );
+ exit(1);
+ }
+ return arg;
+}
+
+
+// process_onenumarg_default( name, argc, argv, defvalue, &n );
+// Process the -d flag, and check that there is a single
+// remaining numeric argument (or no arguments, in which case
+// we use the defvalue), putting it into n
+void process_onenumarg_default( char *name, int argc, char **argv, int defvalue, int *n )
+{
+ char argmsg[100];
+ sprintf( argmsg, "[int default %d]", defvalue );
+ int arg = process_flag_n_m_args( name, argc, argv, 0, 1, argmsg );
+
+ *n = arg == argc ? defvalue : atoi( argv[arg] );
+}
+
+
+// process_onenumarg( name, argc, argv, &n );
+// Process the -d flag, and check that there is a single
+// remaining numeric argument, putting it into n
+void process_onenumarg( char *name, int argc, char **argv, int *n )
+{
+ int arg = process_flag_n_args( name, argc, argv, 1, "int" );
+
+ // argument is in argv[arg]
+ *n = atoi( argv[arg] );
+}
+
+
+// process_twonumargs( name, argc, argv, &m, &n );
+// Process the -d flag, and check that there are 2
+// remaining numeric arguments, putting them into m and n
+void process_twonumargs( char *name, int argc, char **argv, int *m, int *n )
+{
+ int arg = process_flag_n_args( name, argc, argv, 2, "int" );
+
+ // arguments are in argv[arg] and argv[arg+1]
+ *m = atoi( argv[arg++] );
+ *n = atoi( argv[arg] );
+}
+
+
+// process_twostrargs() IS DEPRECATED: use process_flag_n_m_args() instead
+
+
+// int arr[100];
+// int nel = process_listnumargs( name, argc, argv, arr, 100 );
+// Process the -d flag, and check that there are >= 2
+// remaining numeric arguments, putting them into arr[0..nel-1]
+// and returning nel.
+int process_listnumargs( char *name, int argc, char **argv, int *arr, int maxel )
+{
+ int arg=1;
+ if( argc>1 && strcmp( argv[arg], "-d" ) == 0 )
+ {
+ debug = true;
+ arg++;
+ }
+
+ int left = argc-arg;
+ if( left < 2 )
+ {
+ fprintf( stderr, "Usage: %s [-d] list_of_numeric_args\n", name );
+ exit(1);
+ }
+ if( left > maxel )
+ {
+ fprintf( stderr, "%s: more than %d args\n", name, maxel );
+ exit(1);
+ }
+
+ // elements are in argv[arg], argv[arg+1]...
+
+ if( debug )
+ {
+ printf( "debug: remaining arguments are in arg=%d, "
+ "firstn=%s, secondn=%s..\n",
+ arg, argv[arg], argv[arg+1] );
+ }
+
+ int nel = 0;
+ for( int i=arg; i<argc; i++ )
+ {
+ arr[nel++] = atoi( argv[i] );
+ }
+ arr[nel] = -1;
+ return nel;
+}
+
+
+//
+// bool isint = check_unsigned_int( char *val, int *n );
+// Given an string val, check that there's an unsigned integer
+// in it (after optional whitespace). If there is a valid
+// unsigned integer value, store that integer value in *n and
+// return true; otherwise return false (and don't alter *n).
+bool check_unsigned_int( char *val, int *n )
+{
+ // skip whitespace in val
+ char *p;
+ for( p=val; isspace(*p); p++ )
+ {
+ /*EMPTY*/
+ }
+ if( ! isdigit(*p) ) return false;
+ *n = atoi(p);
+ return true;
+}
+
+
+//
+// bool ok = check_unsigned_real( char *val, double *n );
+// Given an string val, check that there's an unsigned real
+// in it (after optional whitespace). If there is a valid
+// unsigned real value, store that value in *n and
+// return true; otherwise return false (and don't alter *n).
+bool check_unsigned_real( char *val, double *n )
+{
+ // skip whitespace in val
+ char *p;
+ for( p=val; isspace(*p); p++ )
+ {
+ /*EMPTY*/
+ }
+ if( ! isdigit(*p) ) return false;
+ *n = atof(p);
+ return true;
+}
diff --git a/challenge-208/duncan-c-white/C/args.h b/challenge-208/duncan-c-white/C/args.h
new file mode 100644
index 0000000000..8844a8f9c4
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/args.h
@@ -0,0 +1,11 @@
+extern bool debug;
+
+extern void process_flag_noarg( char * name, int argc, char ** argv );
+extern int process_flag_n_args( char * name, int argc, char ** argv, int n, char * argmsg );
+extern int process_flag_n_m_args( char * name, int argc, char ** argv, int min, int max, char * argmsg );
+extern void process_onenumarg_default( char * name, int argc, char ** argv, int defvalue, int * n );
+extern void process_onenumarg( char * name, int argc, char ** argv, int * n );
+extern void process_twonumargs( char * name, int argc, char ** argv, int * m, int * n );
+extern int process_listnumargs( char * name, int argc, char ** argv, int * arr, int maxel );
+extern bool check_unsigned_int( char * val, int * n );
+extern bool check_unsigned_real( char * val, double * n );
diff --git a/challenge-208/duncan-c-white/C/ch-1.c b/challenge-208/duncan-c-white/C/ch-1.c
new file mode 100644
index 0000000000..a7d3a673e2
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/ch-1.c
@@ -0,0 +1,176 @@
+//
+// Task 1: Minimum Index Sum
+//
+// C version.
+//
+
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdbool.h>
+#include <string.h>
+#include <ctype.h>
+#include <assert.h>
+
+#include "args.h"
+#include "csvsplit.h"
+
+
+typedef struct
+{
+ char **arr; // array of 256 char *s
+ int nel;
+} strlist;
+
+
+void process1( char *str, void *extra )
+{
+ strlist *e = (strlist *)extra;
+ char *s = strdup( str );
+ assert( s != NULL );
+ e->arr[ e->nel++ ] = s;
+}
+
+
+void print_strlist( strlist *list )
+{
+ bool first = true;
+ for( int i=0; i<list->nel; i++ )
+ {
+ if( ! first ) putchar( ',' );
+ fputs( list->arr[i], stdout );
+ first = false;
+ }
+}
+
+
+// bool isin = in_strlist( word, &list );
+bool in_strlist( char *word, strlist *list )
+{
+ for( int i=0; i<list->nel; i++ )
+ {
+ if( strcmp( word, list->arr[i] ) == 0 )
+ {
+ return true;
+ }
+ }
+ return false;
+}
+
+
+// int sum = indexsum( word, &list1, &list2 );
+// Calculate and return the index sum of word in the two lists.
+int indexsum( char *word, strlist *list1, strlist *list2 )
+{
+ int sum = 0;
+ for( int pos=0; pos < list1->nel; pos++ )
+ {
+ if( strcmp( list1->arr[pos], word ) == 0 )
+ {
+ sum += pos;
+ }
+ }
+ for( int pos=0; pos < list2->nel; pos++ )
+ {
+ if( strcmp( list2->arr[pos], word ) == 0 )
+ {
+ sum += pos;
+ }
+ }
+ return sum;
+}
+
+
+int main( int argc, char **argv )
+{
+ int argno = process_flag_n_args( "mis", argc, argv,
+ 2, "wordlist wordlist" );
+
+ strlist list1;
+ list1.arr = malloc( 256*sizeof(char *) );
+ assert( list1.arr != NULL );
+ list1.nel = 0;
+ csvForeach( argv[argno++], &process1, &list1 );
+
+ strlist list2;
+ list2.arr = malloc( 256*sizeof(char *) );
+ assert( list2.arr != NULL );
+ list2.nel = 0;
+ csvForeach( argv[argno], &process1, &list2 );
+
+ if( debug )
+ {
+ printf( "list1: " );
+ print_strlist( &list1 );
+ putchar( '\n' );
+ printf( "list2: " );
+ print_strlist( &list2 );
+ putchar( '\n' );
+ }
+
+ strlist common;
+ common.arr = malloc( 256*sizeof(char *) );
+ assert( common.arr != NULL );
+ common.nel = 0;
+
+ for( int i=0; i<list1.nel; i++ )
+ {
+ // look for list1.arr[i] in list2
+ if( in_strlist( list1.arr[i], &list2 ) )
+ {
+ common.arr[common.nel++] = list1.arr[i];
+ }
+ }
+ if( debug )
+ {
+ printf( "There are %d common strings: ", common.nel );
+ print_strlist( &common );
+ putchar( '\n' );
+ }
+
+ int mis = list1.nel + list2.nel;
+ strlist best;
+ best.arr = malloc( 256*sizeof(char *) );
+ assert( best.arr != NULL );
+ best.nel = 0;
+
+ for( int pos=0; pos<common.nel; pos++ )
+ {
+ char *w = common.arr[pos];
+ int s = indexsum( w, &list1, &list2 );
+ if( debug )
+ {
+ printf( "The index sum of %s is %d\n", w, s );
+ }
+ if( s < mis )
+ {
+ mis = s;
+ best.arr[0] = w;
+ best.nel = 1;
+ } else if( s == mis )
+ {
+ best.arr[best.nel++] = w;
+ }
+ }
+
+ putchar( '(' );
+ print_strlist( &best );
+ putchar( ')' );
+ putchar( '\n' );
+
+ for( int i=0; i<list1.nel; i++ )
+ {
+ free( list1.arr[i] );
+ }
+ free( list1.arr );
+ for( int i=0; i<list2.nel; i++ )
+ {
+ free( list2.arr[i] );
+ }
+ free( list2.arr );
+
+ free( common.arr );
+
+ free( best.arr );
+
+ return 0;
+}
diff --git a/challenge-208/duncan-c-white/C/ch-2.c b/challenge-208/duncan-c-white/C/ch-2.c
new file mode 100644
index 0000000000..2a7c1c4bb4
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/ch-2.c
@@ -0,0 +1,121 @@
+//
+// Task 2: Duplicate and Missing
+//
+// C version.
+//
+
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdbool.h>
+#include <string.h>
+#include <ctype.h>
+#include <assert.h>
+
+#include "args.h"
+#include "parseints.h"
+#include "printarray.h"
+
+
+// bool isin = in_list( target, arr, nel );
+bool in_list( int target, int *arr, int nel )
+{
+ for( int i=0; i<nel; i++ )
+ {
+ if( arr[i] == target ) return true;
+ }
+ return false;
+}
+
+
+int main( int argc, char **argv )
+{
+ int argno = process_flag_n_m_args( "h-index", argc, argv,
+ 1, 1000, "intlist" );
+
+ int nel;
+ int *list = parse_int_args( argc, argv, argno, &nel );
+
+ if( debug )
+ {
+ printf( "debug: initial list: " );
+ print_int_array( 60, nel, list, ',', stdout );
+ putchar( '\n' );
+ }
+
+ // check that it's sorted
+ int prev = list[0];
+ for( int i=1; i<nel; i++ )
+ {
+ if( list[i] < prev )
+ {
+ fprintf( stderr, "dum: not sorted at element %d\n",
+ list[i] );
+ exit(1);
+ }
+ prev = list[i];
+ }
+
+ int base = list[0];
+ int dup = -1;
+
+ // find any duplicate, and die if there's only one duplicate
+ for( int i=0; i<nel; i++ )
+ {
+ int expect = base+i;
+ int el = list[i];
+ if( el > expect )
+ {
+ fprintf( stderr, "dum: bad input element %d\n", el );
+ exit(1);
+ }
+ if( in_list( el, list, i ) )
+ {
+ if( dup > -1 )
+ {
+ fprintf( stderr, "dum: multiple duplicates "
+ "found at element %d\n", el );
+ exit(1);
+ }
+ dup = el;
+ }
+ }
+
+ if( dup == -1 )
+ {
+ printf( "-1\n" );
+ exit( 0 );
+ }
+
+ if( debug )
+ {
+ printf( "dup is %d\n", dup );
+ }
+
+ // missing is sole member of {B..B+N-1} - all el[i]
+ int missing = -1;
+
+ for( int i=0; i<nel; i++ )
+ {
+ int el = base+i;
+ if( ! in_list( el, list, nel ) )
+ {
+ missing = el;
+ if( debug )
+ {
+ printf( "found missing value %d\n", el );
+ }
+ }
+ }
+
+ if( missing == -1 )
+ {
+ fprintf( stderr, "No missing value found\n" );
+ exit(1);
+ }
+
+ printf( "(%d, %d)\n", dup, missing );
+
+ free( list );
+
+ return 0;
+}
diff --git a/challenge-208/duncan-c-white/C/csvsplit.c b/challenge-208/duncan-c-white/C/csvsplit.c
new file mode 100644
index 0000000000..20e375dabb
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/csvsplit.c
@@ -0,0 +1,47 @@
+/*
+ * csvsplit.c: simple CSV splitting (csvForeach), useful utility function
+ *
+ * (C) Duncan C. White, May 2017
+ */
+
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <stdbool.h>
+#include <assert.h>
+
+#include "csvsplit.h"
+
+
+/*
+ * csvForeach( csvstring, &foreach_callback, (void *)extravalue );
+ * Split csvstring into each comma-separated field, calling the
+ * foreach calback for each comma-separated field, passing the
+ * value and extravalue as parameters to it. It doesn't deal
+ * with commas in quoted strings, however.
+ */
+void csvForeach( char *csvstring, csvforeachcb cb, void *extra )
+{
+ // we need to modify the string, so make a mutable copy..
+ char *copy = strdup( csvstring );
+
+ char *start = copy;
+ for(;;)
+ {
+ char *comma=strchr( start, ',' );
+ if( comma != NULL )
+ {
+ // found the first comma after start
+ *comma = '\0';
+ }
+ //printf( "debug: csvForeach: found value %s\n", start );
+ (*cb)( start, extra );
+
+ if( comma == NULL ) break;
+
+ // move start to one beyond where comma was..
+ start = comma+1;
+ }
+ // don't forget to..
+ free( copy );
+}
diff --git a/challenge-208/duncan-c-white/C/csvsplit.h b/challenge-208/duncan-c-white/C/csvsplit.h
new file mode 100644
index 0000000000..c7f84857c1
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/csvsplit.h
@@ -0,0 +1,14 @@
+/*
+ * csvsplit.h: simple CSV splitting (csvForeach) - doesn't handle
+ * quoted fields with nested commas.
+ *
+ * (C) Duncan C. White, May 2017
+ */
+
+// a csv foreach callback function takes
+// a char * (the csv value split out)
+// and a void * (an extra value).
+
+typedef void (*csvforeachcb)( char *, void * );
+
+extern void csvForeach( char * csvstring, csvforeachcb cb, void * extra );
diff --git a/challenge-208/duncan-c-white/C/parseints.c b/challenge-208/duncan-c-white/C/parseints.c
new file mode 100644
index 0000000000..80408d3382
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/parseints.c
@@ -0,0 +1,114 @@
+// Simple routine to parse one or more arguments,
+// looking for individual +ints or comma-separated
+// lists of +ints.
+//
+
+#include <stdio.h>
+#include <stdlib.h>
+#include <stdbool.h>
+#include <string.h>
+#include <ctype.h>
+#include <assert.h>
+
+#include "args.h"
+#include "printarray.h"
+#include "parseints.h"
+
+typedef struct
+{
+ int nel; // current number of elements
+ int maxel; // maximum number of elements allocated
+ int *list; // malloc()d list of integers
+} intlist;
+
+
+//
+// intlist il.. then initialize il.. then:
+// add_one( element, &il );
+//
+static void add_one( int x, intlist *p )
+{
+ if( p->nel > p->maxel )
+ {
+ p->maxel += 128;
+ p->list = realloc( p->list, p->maxel );
+ assert( p->list != NULL );
+ }
+ #if 0
+ if( debug )
+ {
+ printf( "PIA: appending %d to result at "
+ "pos %d\n", x, p->nel );
+ }
+ #endif
+ p->list[p->nel++] = x;
+}
+
+
+//
+// intlist il.. then initialize il.. then:
+// add_one_arg( argstr, &il );
+//
+static void add_one_arg( char *argstr, intlist *p )
+{
+ int x;
+ if( !check_unsigned_int(argstr,&x) )
+ {
+ fprintf( stderr, "PIA: arg %s must be +int\n", argstr );
+ exit(1);
+ }
+ add_one( x, p );
+}
+
+
+//
+// int nel;
+// int *ilist = parse_int_args( argc, argv, argno, &nel );
+// process all arguments argv[argno..argc-1], extracting either
+// single ints or comma-separated lists of ints from those arguments,
+// accumulate all integers in a dynarray list, storing the total number
+// of elements in nel. This list must be freed by the caller.
+// Note that the list of elements used to be terminated by a -1 value,
+// but I've commented this out from now on.
+//
+int *parse_int_args( int argc, char **argv, int argno, int *nel )
+{
+ int *result = malloc( 128 * sizeof(int) );
+ assert( result != NULL );
+ intlist il = { 0, 128, result };
+
+ #if 0
+ if( debug )
+ {
+ printf( "PIA: parsing ints from args %d..%d\n", argno, argc-1 );
+ }
+ #endif
+ for( int i=argno; i<argc; i++ )
+ {
+ assert( strlen(argv[i]) < 1024 );
+ char copy[1024];
+ strcpy( copy, argv[i] );
+ char *com;
+ char *s;
+ for( s=copy; (com = strchr(s,',')) != NULL; s=com+1 )
+ {
+ *com = '\0';
+ add_one_arg( s, &il );
+ }
+ add_one_arg( s, &il );
+ }
+
+ //add_one( -1, &il );
+
+ #if 0
+ if( debug )
+ {
+ printf( "PIA: final list is " );
+ print_int_array( 80, il.nel, il.list, ',', stdout );
+ putchar( '\n' );
+ }
+ #endif
+
+ *nel = il.nel;
+ return il.list;
+}
diff --git a/challenge-208/duncan-c-white/C/parseints.h b/challenge-208/duncan-c-white/C/parseints.h
new file mode 100644
index 0000000000..da5e145a86
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/parseints.h
@@ -0,0 +1 @@
+extern int * parse_int_args( int argc, char ** argv, int argno, int * nel );
diff --git a/challenge-208/duncan-c-white/C/printarray.c b/challenge-208/duncan-c-white/C/printarray.c
new file mode 100644
index 0000000000..ddee597df3
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/printarray.c
@@ -0,0 +1,39 @@
+#include <stdio.h>
+#include <string.h>
+
+
+// print_int_array( maxw, nelements, results[], sep, outfile );
+// format results[0..nelements-1] as a <sep> separated
+// list onto outfile with lines <= maxw chars long.
+// produces a whole number of lines of output - without the trailing '\n'
+void print_int_array( int maxw, int nel, int *results, char sep, FILE *out )
+{
+ int linelen = 0;
+ for( int i=0; i<nel; i++ )
+ {
+ char buf[100];
+ sprintf( buf, "%d", results[i] );
+ int len = strlen(buf);
+ if( linelen + len + 2 > maxw )
+ {
+ fputc( '\n', out );
+ linelen = 0;
+ } else if( i>0 )
+ {
+ fputc( ' ', out );
+ linelen++;
+ }
+
+ linelen += len;
+ fprintf( out, "%s", buf );
+ if( i<nel-1 )
+ {
+ fputc( sep, out );
+ linelen++;
+ }
+ }
+ //if( linelen>0 )
+ //{
+ // fputc( '\n', out );
+ //}
+}
diff --git a/challenge-208/duncan-c-white/C/printarray.h b/challenge-208/duncan-c-white/C/printarray.h
new file mode 100644
index 0000000000..40efb83277
--- /dev/null
+++ b/challenge-208/duncan-c-white/C/printarray.h
@@ -0,0 +1 @@
+extern void print_int_array( int maxw, int nel, int * results, char sep, FILE * out );
diff --git a/challenge-208/duncan-c-white/README b/challenge-208/duncan-c-white/README
index c6faef5c45..80916b64a2 100644
--- a/challenge-208/duncan-c-white/README
+++ b/challenge-208/duncan-c-white/README
@@ -1,67 +1,86 @@
-Task 1: Keyboard Word
+Task 1: Minimum Index Sum
-You are given an array of words. Write a script to print all the words
-in the given array that can be typed using alphabet on only one row of
-the keyboard.
+You are given two arrays of strings. Write a script to find out all
+common strings in the given two arrays with minimum index sum. If no
+common strings are found returns an empty list.
-Let us assume the keys are arranged as below:
+Example 1
-Row 1: qwertyuiop
-Row 2: asdfghjkl
-Row 3: zxcvbnm
+Input: @list1 = ("Perl", "Raku", "Love")
+ @list2 = ("Raku", "Perl", "Hate")
-Example 1
+Output: ("Perl", "Raku")
- Input: @words = ("Hello","Alaska","Dad","Peace")
- Output: ("Alaska","Dad")
+There are two common strings "Perl" and "Raku".
+Index sum of "Perl": 0 + 1 = 1
+Index sum of "Raku": 1 + 0 = 1
Example 2
- Input: @array = ("OMG","Bye")
- Output: ()
+Input: @list1 = ("A", "B", "C")
+ @list2 = ("D", "E", "F")
+
+Output: ()
+
+No common string found, so no result.
+
+Example 3
-MY NOTES: very easy. Lower case each word, then match it against /^[qwertyuiop]+$/ for the first row, similarly regexes for the second and third rows.
+Input: @list1 = ("A", "B", "C")
+ @list2 = ("C", "A", "B")
+
+Output: ("A")
+
+There are three common strings "A", "B" and "C".
+Index sum of "A": 0 + 1 = 1
+Index sum of "B": 1 + 2 = 3
+Index sum of "C": 2 + 0 = 2
+
+MY NOTES: very easy. Identify whether any common strings exist: set
+intersection. Then calculate index sum of all common strings and choose
+the minimum ones. Trickiest thing to work out is how to input two lists
+of strings - let's choose an arbitrary separator ':'..
GUEST LANGUAGE: As a bonus, I also had a go at translating ch-1.pl into C
-(look in the C directory for that). replaced regexes with a custom: match a
-sequence of <these chars:string>.
+(look in the C directory for that).
-Task 2: H-Index
+Task 2: Duplicate and Missing
-You are given an array of integers containing citations a researcher
-has received for each paper. Write a script to compute the researcher's
-H-Index. For more information please checkout:
+You are given an array of integers in sequence with one missing and one
+duplicate. Write a script to find the duplicate and missing integer in
+the given array. Return -1 if none found. For the sake of this task,
+let us assume the array contains no more than one duplicate and missing.
-https://en.wikipedia.org/wiki/H-index
+Example 1:
-The H-Index is the largest number h such that h articles have at least
-h citations each. For example, if an author has five publications, with
-9, 7, 6, 2, and 1 citations (ordered from greatest to least), then the
-author's H-index is 3, because the author has three publications with 3
-or more citations. However, the author does not have four publications
-with 4 or more citations.
+ Input: @nums = (1,2,2,4)
+ Output: (2,3)
+ Duplicate is 2 and Missing is 3.
-Example 1
+Example 2:
- Input: @citations = (10,8,5,4,3)
- Output: 4
+ Input: @nums = 1,2,3,4
+ Output: -1
-Because the 4th publication has 4 citations and the 5th has only 3.
+ No duplicate and missing found.
-Example 2
+Example 3:
- Input: @citations = (25,8,5,3,3)
- Output: 3
+ Input: @nums = (1,2,3,3)
+ Output: (3,4)
-The H-Index is 3 because the fourth paper has only 3 citations.
+ Duplicate is 3 and Missing is 4.
-MY NOTES: also pretty easy. The Wikipedia entry sheds more light:
+MY NOTES: also pretty easy - especially if the list of integers should (if it
+were not for the one missing and one duplicated) form the sequence 1..N.
+if so: the duplicate is the element where el[i] != i.
+The missing is the sole member of set {1..N} - all el[i]
-"First we order the citations from the largest to the lowest value.
- Then, we look for the last position in which citation[h] >= h."
- (This assumes array indexes start at 1, I think).
+Let's generalise it slightly to B, B+1, .. B+N-1. Then: find the element
+where el[i] != el[0]+i, that is the duplicate, and the missing is the sole
+member of {B..N+N-1} - all el[i]
GUEST LANGUAGE: As a bonus, I also had a go at translating ch-2.pl into C
(look in the C directory for that)
diff --git a/challenge-208/duncan-c-white/perl/ch-1.pl b/challenge-208/duncan-c-white/perl/ch-1.pl
new file mode 100755
index 0000000000..66a0357f0b
--- /dev/null
+++ b/challenge-208/duncan-c-white/perl/ch-1.pl
@@ -0,0 +1,108 @@
+#!/usr/bin/perl
+#
+# Task 1: Minimum Index Sum
+#
+# You are given two arrays of strings. Write a script to find out all
+# common strings in the given two arrays with minimum index sum. If no
+# common strings are found returns an empty list.
+#
+# Example 1
+#
+# Input: @list1 = ("Perl", "Raku", "Love")
+# @list2 = ("Raku", "Perl", "Hate")
+#
+# Output: ("Perl", "Raku")
+#
+# There are two common strings "Perl" and "Raku".
+# Index sum of "Perl": 0 + 1 = 1
+# Index sum of "Raku": 1 + 0 = 1
+#
+# Example 2
+#
+# Input: @list1 = ("A", "B", "C")
+# @list2 = ("D", "E", "F")
+#
+# Output: ()
+#
+# No common string found, so no result.
+#
+# Example 3
+#
+# Input: @list1 = ("A", "B", "C")
+# @list2 = ("C", "A", "B")
+#
+# Output: ("A")
+#
+# There are three common strings "A", "B" and "C".
+# Index sum of "A": 0 + 1 = 1
+# Index sum of "B": 1 + 2 = 3
+# Index sum of "C": 2 + 0 = 2
+#
+# MY NOTES: very easy. Identify whether any common strings exist: set
+# intersection. Then calculate index sum of all common strings and choose
+# the minimum ones. Trickiest thing to work out is how to input two lists
+# of strings - let's assume that they come as two command line args eg.
+# A,B,C and C,A,B
+#
+# GUEST LANGUAGE: As a bonus, I also had a go at translating ch-1.pl into C
+# (look in the C directory for that).
+#
+
+use strict;
+use warnings;
+use feature 'say';
+use Getopt::Long;
+use Data::Dumper;
+
+my $debug=0;
+die "Usage: mis [--debug] word-list word-list\n"
+ unless GetOptions( "debug"=>\$debug ) && @ARGV==2;
+
+my( $list1, $list2 ) = @ARGV;
+my @list1 = split( /,/, $list1 );
+my @list2 = split( /,/, $list2 );
+
+#say "list1: ", join(',',@list1) if $debug;
+#say "list2: ", join(',',@list2) if $debug;
+
+my %set1 = map { $_ => 1 } @list1;
+
+# my $sum = indexsum( $word, \@list1, \@list2 );
+# Calculate and return the index sum of $word in the two lists.
+#
+sub indexsum
+{
+ my( $word, $list1, $list2 ) = @_;
+ my $sum = 0;
+ foreach my $pos (0..$#$list1)
+ {
+ $sum += $pos if $list1[$pos] eq $word;
+ }
+ foreach my $pos (0..$#$list2)
+ {
+ $sum += $pos if $list2[$pos] eq $word;
+ }
+ return $sum;
+}
+
+my @common = grep { $set1{$_} } @list2;
+my $nc = @common;
+say "There are $nc common strings: ", join(',',@common) if $debug;
+
+my $mis = @list1 + @list2;
+my @best = ();
+foreach my $w (@common)
+{
+ my $s = indexsum( $w, \@list1, \@list2 );