git.fiddlerwoaroof.com
Source/AGRegex/pcre-4.3/maketables.c
0c532ca4
 /*************************************************
0223e6a6
  *      Perl-Compatible Regular Expressions       *
  *************************************************/
0c532ca4
 
 /*
0223e6a6
  PCRE is a library of functions to support regular expressions whose syntax
  and semantics are as close as possible to those of the Perl 5 language.
  
  Written by: Philip Hazel <ph10@cam.ac.uk>
  
  Copyright (c) 1997-2003 University of Cambridge
  
  -----------------------------------------------------------------------------
  Permission is granted to anyone to use this software for any purpose on any
  computer system, and to redistribute it freely, subject to the following
  restrictions:
  
  1. This software is distributed in the hope that it will be useful,
  but WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  
  2. The origin of this software must not be misrepresented, either by
  explicit claim or by omission.
  
  3. Altered versions must be plainly marked as such, and must not be
  misrepresented as being the original software.
  
  4. If PCRE is embedded in any software that is released under the GNU
  General Purpose Licence (GPL), then the terms of that licence shall
  supersede any condition above with which it is incompatible.
  -----------------------------------------------------------------------------
  
  See the file Tech.Notes for some information on the internals.
  */
0c532ca4
 
 
 /* This file is compiled on its own as part of the PCRE library. However,
0223e6a6
  it is also included in the compilation of dftables.c, in which case the macro
  DFTABLES is defined. */
0c532ca4
 
 #ifndef DFTABLES
 #include "internal.h"
 #endif
 
 
 
 /*************************************************
0223e6a6
  *           Create PCRE character tables         *
  *************************************************/
0c532ca4
 
 /* This function builds a set of character tables for use by PCRE and returns
0223e6a6
  a pointer to them. They are built using the ctype functions, and consequently
  their contents will depend upon the current locale setting. When compiled as
  part of the library, the store is obtained via pcre_malloc(), but when compiled
  inside dftables, use malloc().
  
  Arguments:   none
  Returns:     pointer to the contiguous block of data
  */
0c532ca4
 
 const unsigned char *
 pcre_maketables(void)
 {
0223e6a6
     unsigned char *yield, *p;
     int i;
     
0c532ca4
 #ifndef DFTABLES
0223e6a6
     yield = (unsigned char*)(pcre_malloc)(tables_length);
0c532ca4
 #else
0223e6a6
     yield = (unsigned char*)malloc(tables_length);
0c532ca4
 #endif
0223e6a6
     
     if (yield == NULL) return NULL;
     p = yield;
     
     /* First comes the lower casing table */
     
     for (i = 0; i < 256; i++) *p++ = tolower(i);
     
     /* Next the case-flipping table */
     
     for (i = 0; i < 256; i++) *p++ = islower(i)? toupper(i) : tolower(i);
     
     /* Then the character class tables. Don't try to be clever and save effort
      on exclusive ones - in some locales things may be different. Note that the
      table for "space" includes everything "isspace" gives, including VT in the
      default locale. This makes it work for the POSIX class [:space:]. */
     
     memset(p, 0, cbit_length);
     for (i = 0; i < 256; i++)
0c532ca4
     {
0223e6a6
         if (isdigit(i))
         {
             p[cbit_digit  + i/8] |= 1 << (i&7);
             p[cbit_word   + i/8] |= 1 << (i&7);
         }
         if (isupper(i))
         {
             p[cbit_upper  + i/8] |= 1 << (i&7);
             p[cbit_word   + i/8] |= 1 << (i&7);
         }
         if (islower(i))
         {
             p[cbit_lower  + i/8] |= 1 << (i&7);
             p[cbit_word   + i/8] |= 1 << (i&7);
         }
         if (i == '_')   p[cbit_word   + i/8] |= 1 << (i&7);
         if (isspace(i)) p[cbit_space  + i/8] |= 1 << (i&7);
         if (isxdigit(i))p[cbit_xdigit + i/8] |= 1 << (i&7);
         if (isgraph(i)) p[cbit_graph  + i/8] |= 1 << (i&7);
         if (isprint(i)) p[cbit_print  + i/8] |= 1 << (i&7);
         if (ispunct(i)) p[cbit_punct  + i/8] |= 1 << (i&7);
         if (iscntrl(i)) p[cbit_cntrl  + i/8] |= 1 << (i&7);
0c532ca4
     }
0223e6a6
     p += cbit_length;
     
     /* Finally, the character type table. In this, we exclude VT from the white
      space chars, because Perl doesn't recognize it as such for \s and for comments
      within regexes. */
     
     for (i = 0; i < 256; i++)
0c532ca4
     {
0223e6a6
         int x = 0;
         if (i != 0x0b && isspace(i)) x += ctype_space;
         if (isalpha(i)) x += ctype_letter;
         if (isdigit(i)) x += ctype_digit;
         if (isxdigit(i)) x += ctype_xdigit;
         if (isalnum(i) || i == '_') x += ctype_word;
         if (strchr("*+?{^.$|()[", i) != 0) x += ctype_meta;
         *p++ = x;
0c532ca4
     }
0223e6a6
     
     return yield;
0c532ca4
 }
 
 /* End of maketables.c */