1 files changed, 762 insertions, 0 deletions
diff --git a/bwb_str.c b/bwb_str.c
new file mode 100644
index 0000000..fdf68a8
--- /dev/null
+++ b/bwb_str.c
@@ -0,0 +1,762 @@
+/***************************************************************
+  
+   bwb_str.c       String-Management Routines
+                        for Bywater BASIC Interpreter
+  
+                        Copyright (c) 1993, Ted A. Campbell
+                        Bywater Software
+  
+                        email: tcamp@delphi.com
+  
+        Copyright and Permissions Information:
+  
+        All U.S. and international rights are claimed by the author,
+        Ted A. Campbell.
+  
+   This software is released under the terms of the GNU General
+   Public License (GPL), which is distributed with this software
+   in the file "COPYING".  The GPL specifies the terms under
+   which users may copy and use the software in this distribution.
+  
+   A separate license is available for commercial distribution,
+   for information on which you should contact the author.
+  
+***************************************************************/
+
+/*---------------------------------------------------------------*/
+/* NOTE: Modifications marked "JBV" were made by Jon B. Volkoff, */
+/* 11/1995 (eidetics@cerf.net).                                  */
+/*                                                               */
+/* Those additionally marked with "DD" were at the suggestion of */
+/* Dale DePriest (daled@cadence.com).                            */
+/*                                                               */
+/* Version 3.00 by Howard Wulf, AF5NE                            */
+/*                                                               */
+/* Version 3.10 by Howard Wulf, AF5NE                            */
+/*                                                               */
+/* Version 3.20 by Howard Wulf, AF5NE                            */
+/*                                                               */
+/*---------------------------------------------------------------*/
+
+
+
+/***************************************************************
+
+BASIC allows embedded NUL (0) characters.  C str*() does not. 
+
+ALL the StringType code should use mem*() and ->length.
+ALL the StringType code should prevent string overflow.
+
+***************************************************************/
+
+
+
+
+#include "bwbasic.h"
+
+
+static int CharListToSet (char *pattern, int start, int stop);
+static int IndexOf (char *buffer, char find, int start);
+
+
+/***************************************************************
+  
+        FUNCTION:       str_btob()
+  
+        DESCRIPTION:    This C function assigns a bwBASIC string
+         structure to another bwBASIC string
+         structure.
+  
+***************************************************************/
+
+int
+str_btob (StringType * d, StringType * s)
+{
+   
+  assert (d != NULL);
+  assert (s != NULL);
+  /*  assert( s->length >= 0 ); */
+  assert( My != NULL );
+
+  if (s->length > MAXLEN)
+  {
+    WARN_STRING_TOO_LONG;        /* str_btob */
+    s->length = MAXLEN;
+  }
+
+  /* get memory for new buffer */
+  if (d->sbuffer != NULL)
+  {
+    /* free the destination's buffer */
+    if (d->sbuffer == My->MaxLenBuffer)
+    {
+      /*
+      ** this occurs when setting the return value of a multi-line string user function
+      **
+      ** FUNCTION INKEY$
+      **   DIM A$
+      **   LINE INPUT A$
+      **   LET INKEY$ = LEFT$( A$, 1 )
+      ** END FUNCTION
+      **
+      */
+    }
+    else if (d->sbuffer == My->ConsoleOutput)
+    {
+      /* this should never occur, but let's make sure we don't crash if it does */
+      WARN_INTERNAL_ERROR;
+      /* continue processing */
+    }
+    else if (d->sbuffer == My->ConsoleInput)
+    {
+      /* this should never occur, but let's make sure we don't crash if it does */
+      WARN_INTERNAL_ERROR;
+      /* continue processing */
+    }
+    else
+    {
+      free (d->sbuffer);
+      d->sbuffer = NULL;
+    }
+    d->sbuffer = NULL;
+    d->length = 0;
+  }
+  if (d->sbuffer == NULL)
+  {
+    /* allocate the destination's buffer */
+    d->length = 0;
+    if ((d->sbuffer =
+         (char *) calloc (s->length + 1 /* NulChar */ ,
+                          sizeof (char))) == NULL)
+    {
+      WARN_OUT_OF_MEMORY;
+      return FALSE;
+    }
+  }
+  /* write the b string to the b string */
+  assert( d->sbuffer != NULL );
+  if( s->length > 0 )
+  { 
+    assert( s->sbuffer != NULL );
+    bwb_memcpy (d->sbuffer, s->sbuffer, s->length);
+  }
+  d->length = s->length;
+  d->sbuffer[d->length] = NulChar;
+  return TRUE;
+}
+
+
+/***************************************************************
+  
+        FUNCTION:       str_cmp()
+  
+   DESCRIPTION:    This C function performs the equivalent
+         of the C strcmp() function, using BASIC
+         strings.
+  
+***************************************************************/
+
+int
+str_cmp (StringType * a, StringType * b)
+{
+   
+  assert (a != NULL);
+  assert (b != NULL);
+  assert( My != NULL );
+  assert( My->CurrentVersion != NULL );
+
+  if (a->length > MAXLEN)
+  {
+    WARN_STRING_TOO_LONG;        /* str_cmp */
+    a->length = MAXLEN;
+  }
+  if (b->length > MAXLEN)
+  {
+    WARN_STRING_TOO_LONG;        /* str_cmp */
+    b->length = MAXLEN;
+  }
+  if (a->sbuffer == NULL)
+  {
+    if (b->sbuffer == NULL)
+    {
+      return 0;
+    }
+    if (b->length == 0)
+    {
+      return 0;
+    }
+    return 1;
+  }
+  assert( a->sbuffer != NULL );
+  a->sbuffer[a->length] = NulChar;
+
+  if (b->sbuffer == NULL)
+  {
+    if (a->sbuffer == NULL)
+    {
+      return 0;
+    }
+    if (a->length == 0)
+    {
+      return 0;
+    }
+    return -1;
+  }
+  assert( b->sbuffer != NULL );
+  b->sbuffer[b->length] = NulChar;
+
+  if (My->CurrentVersion->OptionFlags & OPTION_COMPARE_TEXT)
+  {
+    /* case insensitive */
+    return bwb_stricmp (a->sbuffer, b->sbuffer);        /* NOTE: embedded NUL characters terminate comparison */
+  }
+  else
+  {
+    /* case sensitive */
+    return bwb_strcmp (a->sbuffer, b->sbuffer);        /* NOTE: embedded NUL characters terminate comparison */
+  }
+}
+
+/***************************************************************
+
+                     MATCH
+
+***************************************************************/
+
+int
+str_match (char *A, int A_Length, char *B, int B_Length, int I_Start)
+{
+  /*
+     SYNTAX: j% = MATCH( a$, b$, i% )
+
+     MATCH returns the position of the first occurrence of a$ in b$ 
+     starting with the character position given by the third parameter. 
+     A zero is returned if no MATCH is found. 
+
+     The following pattern-matching features are available: 
+     # matches any digit (0-9). 
+     ! matches any upper-or lower-case letter. 
+     ? matches any character. 
+     \ serves as an escape character indicating the following character does not have special meaning. 
+
+     For example, a ? signifies any character is a MATCH unless preceded by a \. 
+     a$ and b$ must be strings. 
+     If either of these arguments are numeric, an error occurs. 
+     If i% is real, it is converted to an integer. 
+     If i% is a string, an error occurs. 
+     If i% is negative or zero, a run-time error occurs. 
+     When i% is greater than the length of b$, zero is returned. 
+     If b$ is a null string, a 0 is returned. 
+     If b$ is not null, but a$ is null, a 1 is returned.    
+
+     Examples: 
+     MATCH( "is", "Now is the", 1) returns 5
+     MATCH( "##", "October 8, 1876", 1) returns 12
+     MATCH( "a?", "character", 4 ) returns 5
+     MATCH( "\#", "123#45", 1) returns 4
+     MATCH( "ABCD", "ABC", 1 ) returns 0
+     MATCH( "\#1\\\?", "1#1\?2#", 1 ) returns 2
+   */
+
+
+  int a;                        /* current position in A$ */
+  int b;                        /* current position in B$ */
+   
+  assert (A != NULL);
+  assert (B != NULL);
+
+
+  if (I_Start <= 0)
+  {
+    return 0;
+  }
+  if (I_Start > B_Length)
+  {
+    return 0;
+  }
+  if (B_Length <= 0)
+  {
+    return 0;
+  }
+  if (A_Length <= 0)
+  {
+    return 1;
+  }
+  I_Start--;                        /* BASIC to C */
+  for (b = I_Start; b < B_Length; b++)
+  {
+    int n;                        /* number of characters in A$ matched with B$ */
+
+    n = 0;
+    for (a = 0; a < A_Length; a++)
+    {
+      int bn;
+      bn = b + n;
+      if (A[a] == '#' && bwb_isdigit (B[bn]))
+      {
+        n++;
+      }
+      else if (A[a] == '!' && bwb_isalpha (B[bn]))
+      {
+        n++;
+      }
+      else if (A[a] == '?')
+      {
+        n++;
+      }
+      else if (a < (A_Length - 1) && A[a] == '\\' && A[a + 1] == B[bn])
+      {
+        n++;
+        a++;
+      }
+      else if (A[a] == B[bn])
+      {
+        n++;
+      }
+      else
+      {
+        break;
+      }
+    }
+    if (a == A_Length)
+    {
+      b++;                        /* C to BASIC */
+      return b;
+    }
+  }
+  return 0;
+}
+
+
+
+/***************************************************************
+  
+        FUNCTION:       str_like()
+  
+   DESCRIPTION:    This C function performs the equivalent
+         of the BASIC LIKE operator, using BASIC
+         strings.
+  
+***************************************************************/
+
+/* 
+inspired by http://www.blackbeltcoder.com/Articles/net/implementing-vbs-like-operator-in-c 
+*/
+
+/*
+KNOWN ISSUES:
+To match the character '[', use "[[]".
+To match the character '?', use "[?]".
+To match the character '*', use "[*]".
+Does not match "" with "[]" or "[!]".
+*/
+
+#define CHAR_SET '*'
+#define CHAR_CLR ' '
+
+static char charList[256];
+
+static int
+IndexOf (char *buffer, char find, int start)
+{
+  int buffer_count;
+  int buffer_length;
+   
+  assert (buffer != NULL);
+  assert( My != NULL );
+  assert( My->CurrentVersion != NULL );
+
+  buffer_length = bwb_strlen (buffer);
+
+  if (My->CurrentVersion->OptionFlags & OPTION_COMPARE_TEXT)
+  {
+    find = bwb_toupper (find);
+  }
+
+  for (buffer_count = start; buffer_count < buffer_length; buffer_count++)
+  {
+    char theChar;
+
+    theChar = buffer[buffer_count];
+
+    if (My->CurrentVersion->OptionFlags & OPTION_COMPARE_TEXT)
+    {
+      theChar = bwb_toupper (theChar);
+    }
+
+
+    if (theChar == find)
+    {
+      /* FOUND */
+      return buffer_count;
+    }
+
+  }
+  /* NOT FOUND */
+  return -1;
+}
+
+
+static int
+CharListToSet (char *pattern, int start, int stop)
+{
+  /*
+     Converts a string of characters to a HashSet of characters. If the string
+     contains character ranges, such as A-Z, all characters in the range are
+     also added to the returned set of characters.
+   */
+  int pattern_Count;
+   
+  assert (pattern != NULL);
+
+  bwb_memset (charList, CHAR_CLR, 256);
+
+  if (start > stop)
+  {
+    /* ERROR */
+    return FALSE;
+  }
+  /* Leading '-' */
+  while (pattern[start] == '-')
+  {
+    /* Match character '-' */
+
+    charList[0x00FF & pattern[start]] = CHAR_SET;
+    start++;
+    if (start > stop)
+    {
+      /* DONE */
+      return TRUE;
+    }
+  }
+  /* Trailing '-' */
+  while (pattern[stop] == '-')
+  {
+    /* Match character '-' */
+    charList[0x00FF & pattern[stop]] = CHAR_SET;
+    stop--;
+    if (start > stop)
+    {
+      /* DONE */
+      return TRUE;
+    }
+  }
+
+
+  for (pattern_Count = start; pattern_Count <= stop; pattern_Count++)
+  {
+    if (pattern[pattern_Count] == '-')
+    {
+      /* Character range */
+
+      char startChar;
+      char endChar;
+      char theChar;
+
+      if (pattern_Count > start)
+      {
+        startChar = pattern[pattern_Count - 1];
+        if (startChar == '-')
+        {
+          /* ERROR */
+          return FALSE;
+        }
+        if (My->CurrentVersion->OptionFlags & OPTION_COMPARE_TEXT)
+        {
+          startChar = bwb_toupper (startChar);
+        }
+      }
+      else
+      {
+        /* ERROR */
+        return FALSE;
+      }
+      if (pattern_Count < stop)
+      {
+        endChar = pattern[pattern_Count + 1];
+        if (endChar == '-')
+        {
+          /* ERROR */
+          return FALSE;
+        }
+        if (My->CurrentVersion->OptionFlags & OPTION_COMPARE_TEXT)
+        {
+          endChar = bwb_toupper (endChar);
+        }
+        if (endChar < startChar)
+        {
+          /* ERROR */
+          return FALSE;
+        }
+      }
+      else
+      {
+        /* ERROR */
+        return FALSE;
+      }
+      /* 
+         Although the startChar has already been set,
+         and the endChar will be set on the next loop,
+         we go ahead and set them here too.
+         Not the most efficient, but easy to understand,
+         and we do not have to do anything special
+         for edge cases such as [A-A] and [A-B].  
+       */
+      for (theChar = startChar; theChar <= endChar; theChar++)
+      {
+        charList[0x00FF & theChar] = CHAR_SET;
+      }
+    }
+    else
+    {
+      /* Single character */
+      char theChar;
+
+      theChar = pattern[pattern_Count];
+      if (My->CurrentVersion->OptionFlags & OPTION_COMPARE_TEXT)
+      {
+        theChar = bwb_toupper (theChar);
+      }
+      charList[0x00FF & theChar] = CHAR_SET;
+    }
+  }
+
+  return TRUE;
+}
+
+
+
+int
+IsLike (char *buffer, int *buffer_count, int buffer_Length,
+        char *pattern, int *pattern_count, int pattern_Length)
+{
+
+  /* Implement's VB's Like operator logic. */
+
+  /* 
+     if matched then
+     buffer_count is updated
+     pattern_count is updated
+     returns TRUE
+     else
+     returns FALSE
+     end if
+   */
+
+  int bc;
+  int pc;
+   
+  assert (buffer != NULL);
+  assert (buffer_count != NULL);
+  assert (pattern != NULL);
+  assert (pattern_count != NULL);
+  assert( My != NULL );
+  assert( My->CurrentVersion != NULL );
+
+  bc = *buffer_count;
+  pc = *pattern_count;
+
+
+  /* Loop through pattern string */
+  while (pc < pattern_Length)
+  {
+
+    /* Get next pattern character */
+    if (pattern[pc] == '[')
+    {
+      /* Character list */
+      /* [] and [!] are special */
+      char IsExclude;
+
+      IsExclude = CHAR_CLR;
+      pc++;
+      /* pc is first character after '[' */
+      if (pattern[pc] == '!')
+      {
+        pc++;
+        IsExclude = CHAR_SET;
+      }
+      /* pc is first character after '[' */
+      if (pattern[pc] == ']')
+      {
+        /* [] and [!] are special */
+        /* pc is first character after '[' and is a ']' */
+        pc++;
+        if (IsExclude == CHAR_CLR)
+        {
+          /* [] */
+          /* matches "" */
+        }
+        else
+        {
+          /* [!] */
+          /* same as '?' */
+          if (bc >= buffer_Length)
+          {
+            /* we have completed the buffer without completing the pattern */
+            return FALSE;
+          }
+          bc++;
+        }
+      }
+      else
+      {
+        /* Build character list */
+        /* pc is first character after '[' and is not a ']' */
+        int stop_count;
+
+        stop_count = IndexOf (pattern, ']', pc);
+        /* stop_count is the character ']' */
+        if (stop_count < 0)
+        {
+          /* NOT FOUND */
+          return FALSE;
+        }
+        /* pc is first character after '['  */
+        /* stop_count is the character ']' */
+        CharListToSet (pattern, pc, stop_count - 1);
+        pc = stop_count + 1;
+        /* pc is first character after ']' */
+        if (bc >= buffer_Length)
+        {
+          /* we have completed the buffer without completing the pattern */
+          return FALSE;
+        }
+        if (charList[0x00FF & buffer[bc]] == IsExclude)
+        {
+          /* not matched */
+          return FALSE;
+        }
+        bc++;
+      }
+    }
+    else if (pattern[pc] == '?' /* LIKE char */ )
+    {
+      /* Matches a single character */
+      pc++;
+      if (bc >= buffer_Length)
+      {
+        /* Check for end of string */
+        /* we have completed the buffer without completing the pattern */
+        return FALSE;
+      }
+      bc++;
+    }
+    else if (pattern[pc] == '#' /* LIKE digit */ )
+    {
+      /* Matches a single digit */
+      pc++;
+      if (bc >= buffer_Length)
+      {
+        /* Check for end of string */
+        /* we have completed the buffer without completing the pattern */
+        return FALSE;
+      }
+      if (bwb_isdigit (buffer[bc]))
+      {
+        bc++;
+      }
+      else
+      {
+        /* not matched */
+        return FALSE;
+      }
+    }
+    else if (pattern[pc] == '*' /* LIKE chars */ )
+    {
+      /* Zero or more characters */
+      while (pattern[pc] == '*' /* LIKE chars */ )
+      {
+        pc++;
+      }
+      if (pc == pattern_Length)
+      {
+        /* Matches all remaining characters */
+        bc = buffer_Length;
+        pc = pattern_Length;
+        break;
+      }
+      else
+      {
+        int p;
+        int b;
+        int IsMatched;
+
+        p = pc;
+        b = bc;
+        IsMatched = FALSE;
+        while (b <= buffer_Length && IsMatched == FALSE)
+        {
+          int last_b;
+
+          last_b = b;
+          IsMatched =
+            IsLike (buffer, &b, buffer_Length, pattern, &p, pattern_Length);
+          if (IsMatched == FALSE)
+          {
+            /* not matched, try again begining at next buffer position */
+            p = pc;
+            b = last_b + 1;
+          }
+        }
+        if (IsMatched == FALSE)
+        {
+          /* not matched */
+          return FALSE;
+        }
+        pc = p;
+        bc = b;
+      }
+    }
+    else
+    {
+      char pattChar;
+      char buffChar;
+
+      pattChar = pattern[pc];
+      if (bc >= buffer_Length)
+      {
+        /* Check for end of string */
+        /* we have completed the buffer without completing the pattern */
+        return FALSE;
+      }
+      buffChar = buffer[bc];
+
+      if (My->CurrentVersion->OptionFlags & OPTION_COMPARE_TEXT)
+      {
+        pattChar = bwb_toupper (pattChar);
+        buffChar = bwb_toupper (buffChar);
+      }
+
+      if (pattChar == buffChar)
+      {
+        /* matched specified character */
+        pc++;
+        bc++;
+      }
+      else
+      {
+        /* not matched */
+        return FALSE;
+      }
+    }
+  }
+  /* Return true if all characters matched */
+  if (pc < pattern_Length)
+  {
+    /* not matched */
+    return FALSE;
+  }
+  if (bc < buffer_Length)
+  {
+    /* not matched */
+    return FALSE;
+  }
+  /* all characters matched */
+  *buffer_count = bc;
+  *pattern_count = pc;
+  return TRUE;
+}
+
+
+/* EOF */