tinypy: added re and random modules, not adapted for Kolibri yet.

git-svn-id: svn://kolibrios.org@2043 a494cfbc-eb01-0410-851d-a64ba20cac60
2011-08-08 11:24:49 +00:00 · 2011-08-08 11:24:49 +00:00 · 6c55e4b3c3
commit 6c55e4b3c3
parent 3653a07ac3
8 changed files with 5344 additions and 0 deletions
--- a/programs/develop/tinypy/modules/random/init.c
+++ b/programs/develop/tinypy/modules/random/init.c
@ -0,0 +1,52 @@
+#include "random.c"
+
+/*
+ * random_init()
+ *
+ * random module initialization function: creates the module dict, binds
+ * every exported function and special attribute to it, then stores the
+ * dict in tp->modules under the key "random".
+ */
+void random_init(TP)
+{
+    /*
+     * exported name -> implementing C function, listed in binding order
+     */
+    static const struct {
+        const char *name;
+        tp_obj (*impl)(TP);
+    } exports[] = {
+        /* generator state handling and the core generator */
+        { "seed",            random_seed },
+        { "getstate",        random_getstate },
+        { "setstate",        random_setstate },
+        { "jumpahead",       random_jumpahead },
+        { "random",          random_random },
+        /* usual distribution random variable generators */
+        { "uniform",         random_uniform },
+        { "normalvariate",   random_normalvariate },
+        { "lognormvariate",  random_lognormvariate },
+        { "expovariate",     random_expovariate },
+        { "vonmisesvariate", random_vonmisesvariate },
+        { "gammavariate",    random_gammavariate },
+        { "betavariate",     random_betavariate },
+        { "paretovariate",   random_paretovariate },
+        { "weibullvariate",  random_weibullvariate },
+        { "randrange",       random_randrange },
+        { "randint",         random_randint },
+        { "choice",          random_choice },
+        { "shuffle",         random_shuffle }
+    };
+    const int nexports = (int)(sizeof(exports) / sizeof(exports[0]));
+    int k;
+
+    /* module dict for random */
+    tp_obj random_mod = tp_dict(tp);
+
+    /* bind every exported function to the module dict */
+    for (k = 0; k < nexports; k++) {
+        tp_set(tp, random_mod, tp_string(exports[k].name),
+               tp_fnc(tp, exports[k].impl));
+    }
+
+    /* special attributes of the module */
+    tp_set(tp, random_mod, tp_string("__doc__"),  tp_string("Random variable generators."));
+    tp_set(tp, random_mod, tp_string("__name__"), tp_string("random"));
+    tp_set(tp, random_mod, tp_string("__file__"), tp_string(__FILE__));
+
+    /* make the module reachable through tinypy modules[] */
+    tp_set(tp, tp->modules, tp_string("random"), random_mod);
+}
--- a/programs/develop/tinypy/modules/random/random.c
+++ b/programs/develop/tinypy/modules/random/random.c
--- a/programs/develop/tinypy/modules/random/tests.py
+++ b/programs/develop/tinypy/modules/random/tests.py
@ -0,0 +1,176 @@
+#!/usr/bin/env python
+
+import random
+#from math import log, exp, sqrt, pi
+
+def test_seed_state():
+    """test seed() and getstate()/setstate()
+    """
+    # random ought to be able to deal with seeds in any form, of follows.
+    # following code shouldn't cause an exception.
+    random.seed()
+    random.seed(0)
+    random.seed(-1)
+    random.seed(0.1)
+    random.seed(-0.1)
+    random.seed("a")
+    random.seed("abc")
+    random.seed("abcd")
+    random.seed("fasdfasdfasdfadgaldhgldahlgahdlghadlgladh")
+    random.seed("lxhlh90yowhldshlgah;")
+    
+    # state1 and state2 should be different for different seeds
+    random.seed(1)
+    state1 = random.getstate()
+    random.seed(2)
+    state2 = random.getstate()
+    rep = 0
+    for ind in range(len(state1)):
+        elem1 = state1[ind]
+        elem2 = state2[ind]
+        if (elem1 == elem2): rep += 1
+    if (rep > len(state1) / 2):
+        print("rep = ", rep, "len(state1) = ", len(state1))
+        raise "state1 and state2 should be different"
+    
+    # for the same seeds, state1 and state2 should be the same
+    random.seed(100)
+    state1 = random.getstate()
+    random.seed(100)
+    state2 = random.getstate()
+    rep = 0
+    for ind in range(len(state1)):
+        elem1 = state1[ind]
+        elem2 = state2[ind]
+        if (elem1 == elem2): rep += 1
+    if (rep != len(state1)):
+        raise "state1 and state2 should be the same"
+
+def test_jumpahead():
+    """jumpahead will change the pseudo-number generator's internal state
+    """
+    random.seed()
+    state1 = random.getstate()
+    random.jumpahead(20)
+    state2 = random.getstate()
+    rep = 0
+    for ind in range(len(state1)):
+        elem1 = state1[ind]
+        elem2 = state2[ind]
+        if (elem1 == elem2): rep += 1
+    if (rep > len(state1) / 2):
+        raise "state1 and state2 can't be the same"
+        
+def test_setstate():
+    """
+    """
+    random.seed()
+    oldState = random.getstate()
+    oldRandSeq = [random.random() for i in range(10)]
+    random.setstate(oldState)
+    newRandSeq = [random.random() for i in range(10)]
+    rep = 0
+    for ind in range(len(oldRandSeq)):
+        elem1 = oldRandSeq[ind]
+        elem2 = newRandSeq[ind]
+        if (elem1 == elem2): rep += 1
+    if (rep != len(oldRandSeq)):
+        raise "oldRandSeq and newRandSeq should be the same"
+
+def test_random():
+    """generate a random number list
+
+    Smoke test only: 100 calls to random.random() must not raise; the
+    generated values are not inspected.
+    """
+    x = [random.random() for i in range(100)]
+    
+def test_distribution():
+    """these lines are borrowed from python, they shouldn't
+        cause any exception.
+
+    Smoke test only: every distribution function is called once (three
+    times for gammavariate, with different first arguments) and the
+    results are discarded.
+    """
+    g = random
+    g.uniform(1,10)
+    g.paretovariate(1.0)
+    g.expovariate(1.0)
+    g.weibullvariate(1.0, 1.0)
+    g.normalvariate(0.0, 1.0)
+    g.lognormvariate(0.0, 1.0)
+    g.vonmisesvariate(0.0, 1.0)
+    # gammavariate is exercised with a small, a unit and a large first argument
+    g.gammavariate(0.01, 1.0)
+    g.gammavariate(1.0, 1.0)
+    g.gammavariate(200.0, 1.0)
+    g.betavariate(3.0, 3.0)
+
+def test_randrange():
+    """these input to randrange() shouldn't cause any exception.
+
+    Smoke test only: the returned values are not checked.
+    """
+    # one-argument form, including negative, zero and non-integer arguments
+    random.randrange(100000)
+    random.randrange(-100000)
+    random.randrange(0)
+    random.randrange(-10.2)
+    
+    # two-argument form
+    random.randrange(-10, 10)
+    random.randrange(2, 1000)
+    random.randrange(0, 1)
+    random.randrange(-1, 0)
+    
+    # three-argument form, including non-integer bounds
+    random.randrange(10, 2000, 2)
+    random.randrange(-2000, 100, 5)
+    random.randrange(-1000.3, 1000.7, 2)
+
+def test_randint():
+    """for any valid pair (a, b), randint(a, b) should lay between [a, b]
+    """
+    for i in range(1000):
+        r = random.randint(-10000, 10000)
+        if (-10000 <= r <= 10000): continue
+        else: raise "error: random.randint()"
+
+def test_choice():
+    """random.choice() should be able to deal with string, list.
+    """
+    S = "abcdefg123*@#$%)("
+    L = [1, 2, 3, -1, 0.2, -0.1, -10000, "cyc"]
+    
+    if random.choice(S) not in S:
+        raise "error: random.choice(S)"
+    
+    if random.choice(L) not in L:
+        raise "error: random.choice(L)"
+
+def test_shuffle():
+    """test random.shuffle() on list. since string is not writable in-place,
+        random.shuffle() can not be applied on string.
+        Note: to copy items from a list to a new list, must use syntax like:
+            newList = oldList[:]
+        if use syntax like: newList = oldList, newList is just an alias of oldList.
+    """
+    oldL = [1, 2, 3, -1, 0.2, -0.1, -10000, "cyc"]
+    newL = oldL[:]
+    
+    random.shuffle(newL)
+    
+    rep = 0
+    for ind in range(len(oldL)):
+        elem1 = oldL[ind]
+        elem2 = newL[ind]
+        if (elem1 == elem2): rep += 1
+    if (rep > len(oldL) / 2):
+        raise "oldL and newL shouldn't be the same"
+        
+def test_53_bits_per_float():
+    # placeholder: no check is implemented here yet
+    pass
+        
+def main():
+    # run every test in order; a failing test raises, so "#OK" is only
+    # printed when all of them completed
+    test_seed_state()
+    test_jumpahead()
+    test_setstate()
+    test_random()
+    test_distribution()
+    test_randrange()
+    test_randint()
+    test_choice()
+    test_shuffle()
+    test_53_bits_per_float()
+    print("#OK")
+
+if __name__ == '__main__':
+    main()
--- a/programs/develop/tinypy/modules/re/init.c
+++ b/programs/develop/tinypy/modules/re/init.c
@ -0,0 +1,710 @@
+/*
+ * regular expression module
+ *
+ * Important Note: do not support group name index
+ *
+ * $Id$
+ */
+
+#include <stdio.h>
+#include <assert.h>
+#include "regexpr.c"
+
+/* tinypy API to be used in this unit */
+extern tp_obj tp_data(TP,int magic,void *v);
+extern tp_obj tp_object_new(TP);
+extern tp_obj tp_object(TP);
+extern tp_obj tp_method(TP,tp_obj self,tp_obj v(TP));
+extern tp_obj tp_string_copy(TP, const char *s, int n);
+extern tp_obj tp_list(TP);
+extern tp_obj tp_copy(TP);
+
+/* last error message */
+static const char * LastError = NULL;
+
+/*
+ * lower level regex object
+ *
+ * One instance is allocated per compiled pattern by regex_compile() and is
+ * shared, through the "__data__" attribute, by the regex object and by the
+ * match objects derived from it.
+ */
+typedef struct {
+	struct re_pattern_buffer re_patbuf;	/* The compiled expression */
+	struct re_registers re_regs; 		/* The registers from the last match */
+	char re_fastmap[256];				/* Storage for fastmap (re_patbuf.fastmap points here) */
+	unsigned char *re_translate;		/* translate table; set to NULL by regex_compile() */
+	unsigned char *re_lastok;			/* subject of the last successful match/search, else NULL */
+
+	/* supplementary */
+	int re_errno;						/* error num */
+	int re_syntax;						/* syntax */
+} regexobject;
+
+/* local declarations */
+static regexobject* getre(TP, tp_obj rmobj);
+static tp_obj match_obj_group(TP);
+static tp_obj match_obj_groups(TP);
+static tp_obj match_obj_start(TP);
+static tp_obj match_obj_end(TP);
+static tp_obj match_obj_span(TP);
+
+/*
+ * helper function: return lower level regex object
+ * rmobj	- regex or match object
+ *
+ * Reads rmobj's "__data__" attribute and returns the regexobject pointer
+ * stored in it.
+ *
+ * RETURN:
+ * regexobject pointer	- "__data__" is a data object tagged with the
+ *						  regexobject magic and carrying a pointer
+ * NULL					- otherwise; LastError is set to
+ *						  "broken regex object"
+ *
+ * Callers must check the result for NULL before dereferencing it.
+ */
+static regexobject * getre(TP, tp_obj rmobj)
+{
+	tp_obj reobj_data = tp_get(tp, rmobj, tp_string("__data__"));
+
+	/*
+	 * The magic field only exists in data objects, so the object type is
+	 * checked before the magic; a missing payload is reported the same
+	 * way instead of aborting.
+	 */
+	if (reobj_data.type != TP_DATA ||
+			reobj_data.data.magic != (int)sizeof(regexobject) ||
+			reobj_data.data.val == NULL) {
+		LastError = "broken regex object";
+		return (NULL);
+	}
+
+	return ((regexobject *)reobj_data.data.val);
+}
+
+/*
+ * derive match object from regex object
+ * reobj	- regex object whose "__data__" holds the lower level object
+ *
+ * The new match object gets the group/groups/start/end/span methods and a
+ * "__data__" attribute wrapping the very same regexobject pointer as reobj
+ * (the lower level object is shared, not copied).
+ */
+static tp_obj match_object(TP, tp_obj reobj)
+{
+	tp_obj match = tp_object(tp);	/* object being built */
+	tp_obj shared;					/* data object for the match object */
+	regexobject *lowlevel;			/* lower level regex object */
+
+	lowlevel = (regexobject *)
+		tp_get(tp, reobj, tp_string("__data__")).data.val;
+	assert(lowlevel);
+	shared = tp_data(tp, (int)sizeof(regexobject), lowlevel);
+
+	/* methods of the match object */
+	tp_set(tp, match, tp_string("group"),
+			tp_method(tp, match, match_obj_group));
+	tp_set(tp, match, tp_string("groups"),
+			tp_method(tp, match, match_obj_groups));
+	tp_set(tp, match, tp_string("start"),
+			tp_method(tp, match, match_obj_start));
+	tp_set(tp, match, tp_string("end"),
+			tp_method(tp, match, match_obj_end));
+	tp_set(tp, match, tp_string("span"),
+			tp_method(tp, match, match_obj_span));
+
+	/* lower level object, tagged with regexobject's size as magic */
+	tp_set(tp, match, tp_string("__data__"), shared);
+
+	return (match);
+}
+
+/*
+ * FUNC: regexobj.search(str[,pos=0])
+ * self		- regex object
+ * str		- string to be searched
+ * pos		- optional starting offset
+ *
+ * RETURN:
+ * match object	- when matched
+ * None			- not matched
+ *
+ * RAISE:
+ * "regex search error" when self carries no valid lower level regex
+ * object, when pos is outside [0, len(str)], or when re_search() reports
+ * an error (-2).
+ */
+static tp_obj regex_obj_search(TP)
+{
+	tp_obj self = TP_OBJ();		/* regex object */
+	tp_obj str = TP_STR();
+	tp_obj pos = TP_DEFAULT(tp_number(0));
+	regexobject *re = NULL;
+	int r = -2;					/* -2 indicate exception */
+	int startpos;
+	int range;
+
+	/*
+	 * Resolve the lower level object before anything can jump to the
+	 * exception label, which resets re->re_lastok: getre() may return
+	 * NULL and must not be dereferenced in that case.
+	 */
+	re = getre(tp, self);
+	if (re == NULL)
+		goto exception;
+	re->re_lastok = NULL;
+
+	if (pos.number.val < 0 || pos.number.val > str.string.len) {
+		LastError = "search offset out of range";
+		goto exception;
+	}
+	startpos = (int)pos.number.val;
+	range = str.string.len - startpos;
+
+	r = re_search(&re->re_patbuf, (unsigned char *)str.string.val, 
+			str.string.len, startpos, range, &re->re_regs);
+
+	/* cannot match pattern; re_lastok is already NULL */
+	if (r == -1)
+		return (tp_None);
+
+	/* error occurred */
+	if (r == -2)
+		goto exception;
+
+	/* matched: remember the subject so the match object can slice it */
+	re->re_lastok = (unsigned char *)str.string.val;
+
+	return (match_object(tp, self));
+
+exception:
+	if (re != NULL)
+		re->re_lastok = NULL;
+	tp_raise(tp_None, tp_string("regex search error"));
+}
+
+/*
+ * FUNC: regexobj.match(str[,pos=0])
+ * self		- regex object
+ * str		- string to be matched
+ * pos		- optional starting position
+ *
+ * RETURN:
+ * match object	- when matched
+ * None			- not matched
+ *
+ * RAISE:
+ * "regex match error" when self carries no valid lower level regex
+ * object, when pos is outside [0, len(str)], or when re_match() reports
+ * an error (-2).
+ */
+static tp_obj regex_obj_match(TP)
+{
+	tp_obj self = TP_OBJ();		/* regex object */
+	tp_obj str = TP_STR();
+	tp_obj pos = TP_DEFAULT(tp_number(0));
+	regexobject *re = NULL;
+	int r = -2;					/* -2 indicate exception */
+
+	/* getre() may return NULL; never dereference it unchecked */
+	re = getre(tp, self);
+	if (re == NULL)
+		goto exception;
+	re->re_lastok = NULL;
+
+	/* same offset validation as search(): reject positions outside str */
+	if (pos.number.val < 0 || pos.number.val > str.string.len) {
+		LastError = "match offset out of range";
+		goto exception;
+	}
+
+	r = re_match(&re->re_patbuf, (unsigned char *)str.string.val, 
+			str.string.len, (int)pos.number.val, &re->re_regs);
+
+	/* cannot match pattern; re_lastok is already NULL */
+	if (r == -1)
+		return (tp_None);
+
+	/* error occurred */
+	if (r == -2)
+		goto exception;
+
+	/* matched: remember the subject so the match object can slice it */
+	re->re_lastok = (unsigned char *)str.string.val;
+
+	return (match_object(tp, self));
+
+exception:
+	if (re != NULL)
+		re->re_lastok = NULL;
+	tp_raise(tp_None, tp_string("regex match error"));
+}
+
+/*
+ * regex object split()
+ * self		- regex object
+ * restr	- string to be split
+ * maxsplit	- max split field, default 0, mean no limit
+ *
+ * RETURN:
+ * list of the non-empty fields found between separator matches, followed
+ * by the non-empty remainder of the string. Empty fields are dropped and
+ * do not count against maxsplit. Empty matches of the pattern are not
+ * treated as separators.
+ *
+ * RAISE:
+ * when maxsplit is negative, or when self carries no valid lower level
+ * regex object.
+ */
+static tp_obj regex_obj_split(TP)
+{
+	tp_obj self		= TP_OBJ();	/* regex object */
+	tp_obj restr	= TP_STR();	/* string */
+	tp_obj maxsplit = TP_DEFAULT(tp_number(0));
+	tp_obj maobj;				/* match object */
+	regexobject *re = NULL;		/* lower level regex object */
+	tp_obj result	= tp_list(tp);
+	tp_obj grpstr;				/* group string */
+	int	slen;					/* string length */
+	int srchloc;				/* search location */
+	int fieldloc;				/* start of the field being collected */
+	int remaining;				/* fields still allowed when limited */
+	int unlimited;				/* maxsplit == 0 means no limit */
+
+	if (maxsplit.number.val < 0)
+		tp_raise(tp_None, tp_string("split() maxsplit must not be negative"));
+	remaining = (int)maxsplit.number.val;
+	unlimited = (remaining == 0);
+
+	re = getre(tp, self);
+	if (re == NULL)
+		tp_raise(tp_None, tp_string("broken regex object"));
+
+	srchloc = 0;
+	fieldloc = 0;
+	/* the string carries its own length; it need not be NUL terminated */
+	slen = restr.string.len;
+
+	do {
+		int start;
+		int end;
+
+		/* generate a temp match object */
+		tp_params_v(tp, 3, self, restr, tp_number(srchloc));
+		maobj = regex_obj_search(tp);
+		if (!tp_bool(tp, maobj)) 
+			break;
+
+		if (re->re_lastok == NULL) {
+			tp_raise(tp_None, tp_string("no match for split()"));
+		}
+
+		start = re->re_regs.start[0];
+		end   = re->re_regs.end[0];
+		if (start < 0 || end < 0)
+			break;
+
+		/*
+		 * An empty match consumes nothing, so searching again from its
+		 * end would find it forever. Skip it: resume one character
+		 * further while keeping the start of the current field.
+		 */
+		if (end == start) {
+			srchloc = start + 1;
+			continue;
+		}
+
+		/* extract the field in front of the separator */
+		grpstr = tp_string_copy(tp, 
+				(const char *)restr.string.val + fieldloc, start - fieldloc);
+
+		if (tp_bool(tp, grpstr)) {
+			tp_set(tp, result, tp_None, grpstr);
+			remaining--;
+		}
+
+		fieldloc = end;
+		srchloc = end;
+	} while (srchloc < slen && (unlimited || remaining > 0));
+
+	/* collect remaining string, if necessary */
+	if (fieldloc < slen) {
+		grpstr = tp_string_copy(tp, 
+				(const char *)restr.string.val + fieldloc, slen - fieldloc);
+		if (tp_bool(tp, grpstr))
+			tp_set(tp, result, tp_None, grpstr);
+	}
+
+	return (result);
+}
+
+/*
+ * regex object findall()
+ * self		- regex object
+ * restr	- string to be searched
+ * pos		- starting position, default 0
+ *
+ * RETURN:
+ * list of the non-empty substrings matched by the whole pattern, in the
+ * order they are found from pos on. The list is empty when nothing
+ * matches (including when pos == len(restr)).
+ *
+ * RAISE:
+ * when pos is outside [0, len(restr)], or when self carries no valid
+ * lower level regex object.
+ */
+static tp_obj regex_obj_findall(TP)
+{
+	tp_obj self		= TP_OBJ();	/* regex object */
+	tp_obj restr	= TP_STR();	/* string */
+	tp_obj pos		= TP_DEFAULT(tp_number(0));
+	tp_obj maobj;				/* match object */
+	regexobject *re = NULL;		/* lower level regex object */
+	tp_obj result	= tp_list(tp);
+	tp_obj grpstr;				/* group string */
+	int	slen;					/* string length */
+	int srchloc;				/* search location */
+
+	/* the string carries its own length; it need not be NUL terminated */
+	slen	= restr.string.len;
+	if (pos.number.val < 0 || pos.number.val > slen)
+		tp_raise(tp_None, tp_string("starting position out of range"));
+	srchloc = (int)pos.number.val;
+
+	re = getre(tp, self);
+	if (re == NULL)
+		tp_raise(tp_None, tp_string("broken regex object"));
+
+	while (srchloc < slen) {
+		int start;
+		int end;
+
+		/* generate a temp match object */
+		tp_params_v(tp, 3, self, restr, tp_number(srchloc));
+		maobj = regex_obj_search(tp);
+		if (!tp_bool(tp, maobj)) 
+			break;
+
+		if (re->re_lastok == NULL) {
+			tp_raise(tp_None, tp_string("no match for findall()"));
+		}
+
+		start = re->re_regs.start[0];
+		end   = re->re_regs.end[0];
+		if (start < 0 || end < 0)
+			break;
+
+		grpstr = tp_string_copy(tp, 
+				(const char *)re->re_lastok + start, end - start);
+
+		/* empty matches yield an empty string, which is not collected */
+		if (tp_bool(tp, grpstr)) {
+			tp_set(tp, result, tp_None, grpstr);
+		}
+
+		/*
+		 * Always move forward: an empty match ends where it starts, so
+		 * step one character past it or the same match repeats forever.
+		 */
+		srchloc = (end > start) ? end : end + 1;
+	}
+
+	return (result);
+}
+
+/*
+ * FUNC: matchobj.group([group1, ...])
+ * self		- match object
+ * args		- optional group indices, default 0
+ *
+ * RETURN:
+ * with no or one index	- the specified group as a string, or None when
+ *						  that group did not take part in the match
+ * with several indices	- list holding one such entry per index
+ *
+ * RAISE:
+ * when there was no successful match/search, when an index is outside
+ * [0, RE_NREGS), or when more than RE_NREGS indices are given.
+ */
+static tp_obj match_obj_group(TP)
+{
+	tp_obj self = TP_OBJ();		/* match object */
+	tp_obj grpidx;				/* a group index */
+	regexobject *re = NULL;
+	int indices[RE_NREGS];
+	int start;
+	int end;
+	int i;
+	int single = 0;				/* single group index? */
+	tp_obj result;
+
+	/* get lower level regex object representation */
+	re = getre(tp, self);
+	if (re == NULL || re->re_lastok == NULL)
+		tp_raise(tp_None, 
+				tp_string("group() only valid after successful match/search"));
+
+	/* -1 marks the end of the requested index list */
+	for (i = 0; i < RE_NREGS; i++)
+		indices[i] = -1;
+
+	/*
+	 * if no group index provided, supply default group index 0; else
+	 * fill in indices[] with provided group index list.
+	 */
+	if (tp->params.list.val->len == 0) {
+		indices[0] = 0;
+		single = 1;
+	} else if (tp->params.list.val->len == 1) {
+		indices[0] = (int)TP_NUM();
+		/* registers are numbered 0 .. RE_NREGS-1 */
+		if (indices[0] < 0 || indices[0] >= RE_NREGS)
+			tp_raise(tp_None, tp_string("group() grpidx out of range"));
+		single = 1;
+	} else {
+		i = 0;
+		TP_LOOP(grpidx)
+		/* reject bad indices and never write past indices[] */
+		if (i >= RE_NREGS ||
+				grpidx.number.val < 0 || grpidx.number.val >= RE_NREGS)
+			tp_raise(tp_None, tp_string("group() grpidx out of range"));
+		indices[i++] = (int)grpidx.number.val;
+		TP_END
+	}
+
+	/* generate result string list */
+	result = tp_list(tp);
+	for (i = 0; i < RE_NREGS && indices[i] >= 0; i++) {
+		tp_obj grpstr;
+		start = re->re_regs.start[indices[i]];
+		end   = re->re_regs.end[indices[i]];
+		if (start < 0 || end < 0) {
+			grpstr = tp_None;
+		} else {
+			grpstr = tp_string_copy(tp, (const char *)re->re_lastok + start, 
+					end - start);
+		}
+		tp_set(tp, result, tp_None, grpstr);
+	}
+	return (single ? tp_get(tp, result, tp_number(0)) : result);
+}
+
+/*
+ * FUNC: matchobj.groups()
+ * self	- match object.
+ * return all groups.
+ * Note: CPython allow a 'default' argument, but we disallow it.
+ *
+ * RETURN:
+ * list of the non-empty strings of groups 1, 2, ... Collection stops at
+ * the first group whose start or end register is negative.
+ *
+ * RAISE:
+ * when self carries no valid lower level regex object or there was no
+ * successful match/search.
+ */
+static tp_obj match_obj_groups(TP)
+{
+	tp_obj self = TP_OBJ();		/* match object */
+	regexobject *re = NULL;
+	int start;
+	int end;
+	int i;
+	tp_obj grpstr;				/* group string */
+	tp_obj result = tp_list(tp);
+
+	/* getre() may return NULL; never dereference it unchecked */
+	re = getre(tp, self);
+	if (re == NULL || re->re_lastok == NULL) {
+		tp_raise(tp_None, 
+				tp_string("groups() only valid after successful match/search"));
+	}
+
+	/* register 0 is the whole match, so groups start at 1 */
+	for (i = 1; i < RE_NREGS; i++) {
+		start = re->re_regs.start[i];
+		end   = re->re_regs.end[i];
+		if (start < 0 || end < 0)
+			break;
+
+		grpstr = tp_string_copy(tp, 
+				(const char *)re->re_lastok + start, end - start);
+
+		if (tp_bool(tp, grpstr))
+			tp_set(tp, result, tp_None, grpstr);
+	}
+
+	return (result);
+}
+
+/*
+ * FUNC: matchobj.start([group])
+ * self		- match object
+ * group	- group index, default 0
+ * return starting position of matched 'group' substring.
+ *
+ * RAISE:
+ * when there was no successful match/search, or when group is outside
+ * [0, RE_NREGS).
+ */
+static tp_obj match_obj_start(TP)
+{
+	tp_obj self = TP_OBJ();						/* match object */
+	tp_obj group = TP_DEFAULT(tp_number(0));	/* group */
+	regexobject *re = NULL;
+	int start;
+
+	/* getre() may return NULL; never dereference it unchecked */
+	re = getre(tp, self);
+	if (re == NULL || re->re_lastok == NULL) {
+		tp_raise(tp_None, 
+				tp_string("start() only valid after successful match/search"));
+	}
+
+	/* registers are numbered 0 .. RE_NREGS-1, so RE_NREGS itself is out */
+	if (group.number.val < 0 || group.number.val >= RE_NREGS)
+		tp_raise(tp_None, tp_string("IndexError: group index out of range"));
+
+	start = re->re_regs.start[(int)group.number.val];
+
+	return (tp_number(start));
+}
+
+/*
+ * FUNC: matchobj.end([group])
+ * self		- match object
+ * group	- group index, default 0
+ * return ending position of matched 'group' substring.
+ *
+ * RAISE:
+ * when there was no successful match/search, or when group is outside
+ * [0, RE_NREGS).
+ */
+static tp_obj match_obj_end(TP)
+{
+	tp_obj self = TP_OBJ();						/* match object */
+	tp_obj group = TP_DEFAULT(tp_number(0));	/* group */
+	regexobject *re = NULL;
+	int end;
+
+	/* getre() may return NULL; never dereference it unchecked */
+	re = getre(tp, self);
+	if (re == NULL || re->re_lastok == NULL) {
+		tp_raise(tp_None, 
+				tp_string("end() only valid after successful match/search"));
+	}
+
+	/* registers are numbered 0 .. RE_NREGS-1, so RE_NREGS itself is out */
+	if (group.number.val < 0 || group.number.val >= RE_NREGS)
+		tp_raise(tp_None, tp_string("IndexError: group index out of range"));
+
+	end = re->re_regs.end[(int)group.number.val];
+
+	return (tp_number(end));
+}
+
+/*
+ * FUNC: matchobj.span([group])
+ * self		- match object
+ * group	- group index, default 0
+ * return [start,end] position pair of matched 'group' substring.
+ *
+ * RAISE:
+ * when there was no successful match/search, or when group is outside
+ * [0, RE_NREGS).
+ */
+static tp_obj match_obj_span(TP)
+{
+	tp_obj self = TP_OBJ();						/* match object */
+	tp_obj group = TP_DEFAULT(tp_number(0));	/* group */
+	regexobject *re = NULL;
+	int idx;
+	tp_obj result;
+
+	/* getre() may return NULL; never dereference it unchecked */
+	re = getre(tp, self);
+	if (re == NULL || re->re_lastok == NULL) {
+		tp_raise(tp_None, 
+				tp_string("span() only valid after successful match/search"));
+	}
+
+	/* registers are numbered 0 .. RE_NREGS-1, so RE_NREGS itself is out */
+	if (group.number.val < 0 || group.number.val >= RE_NREGS)
+		tp_raise(tp_None, tp_string("IndexError: group index out of range"));
+	idx = (int)group.number.val;
+
+	/* a two element list: [start, end] */
+	result = tp_list(tp);
+	tp_set(tp, result, tp_None, tp_number(re->re_regs.start[idx]));
+	tp_set(tp, result, tp_None, tp_number(re->re_regs.end[idx]));
+
+	return (result);
+}
+
+/*
+ * compile out a re object
+ * repat	- regex pattern
+ * resyn	- regex syntax, default RE_SYNTAX_EMACS; only stored in the
+ *			  lower level object's re_syntax field here
+ *
+ * RETURN:
+ * regex object with the methods search/match/split/findall and a
+ * "__data__" attribute wrapping the lower level regexobject.
+ *
+ * RAISE:
+ * the error message when the lower level object cannot be allocated or
+ * when re_compile_pattern() rejects the pattern. Everything allocated
+ * for the lower level object is released before raising.
+ */
+static tp_obj regex_compile(TP)
+{
+	const char *error = NULL;
+	tp_obj reobj_data;
+	tp_obj repat = TP_TYPE(TP_STRING);						/* pattern */
+	tp_obj resyn = TP_DEFAULT(tp_number(RE_SYNTAX_EMACS));	/* syntax */
+	tp_obj reobj;	/* regex object */
+	regexobject *re;
+
+	/*
+	 * create regex object, its parent is builtin 'object'
+	 */
+	reobj = tp_object(tp);
+
+	re = (regexobject *)malloc(sizeof(regexobject));
+	if (!re) {
+		error = "malloc lower level regex object failed";
+		goto finally;
+	}
+
+	/* start from an empty pattern buffer using our own fastmap storage */
+	re->re_patbuf.buffer = NULL;
+	re->re_patbuf.allocated = 0;
+	re->re_patbuf.fastmap = (unsigned char *)re->re_fastmap;
+	re->re_patbuf.translate = NULL;
+	re->re_translate = NULL;
+	re->re_lastok = NULL;
+
+	re->re_errno = 0;
+	re->re_syntax = (int)resyn.number.val;
+
+	error = re_compile_pattern((unsigned char *)repat.string.val,
+			repat.string.len, &re->re_patbuf);
+	if (error != NULL) {
+		LastError = error;
+		goto finally;
+	}
+
+	/* regexobject's size as magic */
+	reobj_data = tp_data(tp, (int)sizeof(regexobject), re);
+
+	/*
+	 * bind to regex object
+	 */
+	tp_set(tp, reobj, tp_string("search"), 
+			tp_method(tp, reobj, regex_obj_search));
+	tp_set(tp, reobj, tp_string("match"), 
+			tp_method(tp, reobj, regex_obj_match));
+	tp_set(tp, reobj, tp_string("split"),
+			tp_method(tp, reobj, regex_obj_split));
+	tp_set(tp, reobj, tp_string("findall"),
+			tp_method(tp, reobj, regex_obj_findall));
+	tp_set(tp, reobj, tp_string("__data__"), reobj_data);
+
+	tp_set(tp, reobj, tp_string("__name__"), 
+			tp_string("regular expression object"));
+	tp_set(tp, reobj, tp_string("__doc__"), tp_string(
+				"regular expression object, support methods:\n"
+				"search(str[,pos=0])-search 'str' from 'pos'\n"
+				"match(str[,pos=0])	-match 'str' from 'pos'\n"
+				));
+
+	return (reobj);
+
+finally:
+	/*
+	 * Failure path: nothing references the lower level object yet, so
+	 * release it here or it leaks. The pattern buffer is caller-owned
+	 * malloc memory (NULL when never allocated; free(NULL) is a no-op).
+	 */
+	if (re != NULL) {
+		free(re->re_patbuf.buffer);
+		free(re);
+	}
+	tp_raise(tp_None, tp_string(error));
+}
+
+/*
+ * module level search()
+ * repat	- regex pattern
+ * restr	- string to be searched
+ * resyn	- regex syntax, optional, default RE_SYNTAX_EMACS
+ *
+ * Compiles a temporary regex object and returns what its search()
+ * returns for 'restr' from offset 0.
+ */
+static tp_obj regex_search(TP)
+{
+	tp_obj pattern = TP_OBJ();
+	tp_obj subject = TP_OBJ();
+	tp_obj syntax  = TP_DEFAULT(tp_number(RE_SYNTAX_EMACS));
+	tp_obj compiled;			/* temporary regex object */
+
+	/* step 1: compile(pattern, syntax) */
+	tp_params_v(tp, 2, pattern, syntax);
+	compiled = regex_compile(tp);
+
+	/* step 2: compiled.search(subject, 0) */
+	tp_params_v(tp, 3, compiled, subject, tp_number(0));
+	return (regex_obj_search(tp));
+}
+
+/*
+ * module level match()
+ * repat	- regex pattern
+ * restr	- string to be matched
+ * resyn	- regex syntax, optional, default RE_SYNTAX_EMACS
+ *
+ * Compiles a temporary regex object and returns what its match()
+ * returns for 'restr' from position 0.
+ */
+static tp_obj regex_match(TP)
+{
+	tp_obj pattern = TP_OBJ();
+	tp_obj subject = TP_OBJ();
+	tp_obj syntax  = TP_DEFAULT(tp_number(RE_SYNTAX_EMACS));
+	tp_obj compiled;			/* temporary regex object */
+
+	/* step 1: compile(pattern, syntax) */
+	tp_params_v(tp, 2, pattern, syntax);
+	compiled = regex_compile(tp);
+
+	/* step 2: compiled.match(subject, 0) */
+	tp_params_v(tp, 3, compiled, subject, tp_number(0));
+	return (regex_obj_match(tp));
+}
+
+/*
+ * module level split()
+ * repat	- regex pattern
+ * restr	- string to be split
+ * maxsplit	- max split field, default 0, mean no limit
+ *
+ * The pattern is always compiled with RE_SYNTAX_EMACS; the result is
+ * whatever the temporary regex object's split() returns.
+ */
+static tp_obj regex_split(TP)
+{
+	tp_obj pattern = TP_OBJ();
+	tp_obj subject = TP_OBJ();
+	tp_obj limit   = TP_DEFAULT(tp_number(0));
+	tp_obj compiled;			/* temporary regex object */
+
+	/* step 1: compile(pattern, RE_SYNTAX_EMACS) */
+	tp_params_v(tp, 2, pattern, tp_number(RE_SYNTAX_EMACS));
+	compiled = regex_compile(tp);
+
+	/* step 2: compiled.split(subject, limit) */
+	tp_params_v(tp, 3, compiled, subject, limit);
+	return regex_obj_split(tp);
+}
+
+/*
+ * module level findall()
+ * repat	- regex pattern
+ * restr	- string to be searched
+ * resyn	- regex syntax, optional, default RE_SYNTAX_EMACS
+ *
+ * Compiles a temporary regex object and returns what its findall()
+ * returns for 'restr'; no starting position is passed on, so the
+ * object's own default applies.
+ */
+static tp_obj regex_findall(TP)
+{
+	tp_obj pattern = TP_OBJ();
+	tp_obj subject = TP_OBJ();
+	tp_obj syntax  = TP_DEFAULT(tp_number(RE_SYNTAX_EMACS));
+	tp_obj compiled;			/* temporary regex object */
+
+	/* step 1: compile(pattern, syntax) */
+	tp_params_v(tp, 2, pattern, syntax);
+	compiled = regex_compile(tp);
+
+	/* step 2: compiled.findall(subject) */
+	tp_params_v(tp, 2, compiled, subject);
+	return regex_obj_findall(tp);
+}
+
+
+/*
+ * re module initialization function.
+ *
+ * The module exposes the functions 'compile', 'search', 'match', 'split'
+ * and 'findall' plus the four *_SYNTAX constants. 'compile' returns a
+ * regex object supporting the methods 'search', 'match', 'split' and
+ * 'findall'; a successful search/match yields a match object supporting
+ * 'group', 'groups', 'start', 'end' and 'span'.
+ */
+void re_init(TP)
+{
+	/* module level functions, in binding order */
+	static const struct {
+		const char *name;
+		tp_obj (*impl)(TP);
+	} funcs[] = {
+		{ "compile", regex_compile },
+		{ "search",  regex_search },
+		{ "match",   regex_match },
+		{ "split",   regex_split },
+		{ "findall", regex_findall }
+	};
+	/* syntax constants, in binding order */
+	static const struct {
+		const char *name;
+		int value;
+	} syntaxes[] = {
+		{ "AWK_SYNTAX",   RE_SYNTAX_AWK },
+		{ "EGREP_SYNTAX", RE_SYNTAX_EGREP },
+		{ "GREP_SYNTAX",  RE_SYNTAX_GREP },
+		{ "EMACS_SYNTAX", RE_SYNTAX_EMACS }
+	};
+	const int nfuncs = (int)(sizeof(funcs) / sizeof(funcs[0]));
+	const int nsyntaxes = (int)(sizeof(syntaxes) / sizeof(syntaxes[0]));
+	int k;
+
+	/* module dict for re */
+	tp_obj re_mod = tp_dict(tp);
+
+	/* bind functions, then constants, to re module */
+	for (k = 0; k < nfuncs; k++) {
+		tp_set(tp, re_mod, tp_string(funcs[k].name),
+				tp_fnc(tp, funcs[k].impl));
+	}
+	for (k = 0; k < nsyntaxes; k++) {
+		tp_set(tp, re_mod, tp_string(syntaxes[k].name),
+				tp_number(syntaxes[k].value));
+	}
+
+	/* bind special attributes to re module */
+	tp_set(tp, re_mod, tp_string("__name__"), 
+			tp_string("regular expression module"));
+	tp_set(tp, re_mod, tp_string("__file__"), tp_string(__FILE__));
+	tp_set(tp, re_mod, tp_string("__doc__"), 
+			tp_string("simple regular express implementation"));
+
+	/* bind regex module to tinypy modules[] */
+	tp_set(tp, tp->modules, tp_string("re"), re_mod);
+}
+
--- a/programs/develop/tinypy/modules/re/regexpr.c
+++ b/programs/develop/tinypy/modules/re/regexpr.c
--- a/programs/develop/tinypy/modules/re/regexpr.h
+++ b/programs/develop/tinypy/modules/re/regexpr.h
@ -0,0 +1,160 @@
+/*
+ * -*- mode: c-mode; c-file-style: python -*-
+ */
+
+#ifndef Py_REGEXPR_H
+#define Py_REGEXPR_H
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+/*
+ * regexpr.h
+ *
+ * Author: Tatu Ylonen <ylo@ngs.fi>
+ *
+ * Copyright (c) 1991 Tatu Ylonen, Espoo, Finland
+ *
+ * Permission to use, copy, modify, distribute, and sell this software
+ * and its documentation for any purpose is hereby granted without fee,
+ * provided that the above copyright notice appear in all copies.  This
+ * software is provided "as is" without express or implied warranty.
+ *
+ * Created: Thu Sep 26 17:15:36 1991 ylo
+ * Last modified: Mon Nov  4 15:49:46 1991 ylo
+ */
+
+/* $Id$ */
+
+#ifndef REGEXPR_H
+#define REGEXPR_H
+
+#define RE_NREGS	100  /* number of registers available */
+
+/*
+ * Compiled pattern. regexp_t is a pointer to this structure and is the
+ * type the prototypes below use for their 'compiled' argument.
+ */
+typedef struct re_pattern_buffer
+{
+	unsigned char *buffer;          /* compiled pattern */
+	int allocated;         /* allocated size of compiled pattern */
+	int used;              /* actual length of compiled pattern */
+	unsigned char *fastmap;         /* fastmap[ch] is true if ch can start pattern */
+	unsigned char *translate;       /* translation to apply during compilation/matching */
+	unsigned char fastmap_accurate; /* true if fastmap is valid */
+	unsigned char can_be_null;      /* true if can match empty string */
+	unsigned char uses_registers;   /* registers are used and need to be initialized */
+	int num_registers;     /* number of registers used */
+	unsigned char anchor;           /* anchor: 0=none 1=begline 2=begbuf */
+} *regexp_t;
+
+/*
+ * Match registers: one start/end offset pair per register, RE_NREGS
+ * pairs in total. regexp_registers_t is a pointer to this structure.
+ */
+typedef struct re_registers
+{
+	int start[RE_NREGS];  /* start offset of region */
+	int end[RE_NREGS];    /* end offset of region */
+} *regexp_registers_t;
+
+/* bit definitions for syntax */
+#define RE_NO_BK_PARENS		1    /* no quoting for parentheses */
+#define RE_NO_BK_VBAR		2    /* no quoting for vertical bar */
+#define RE_BK_PLUS_QM		4    /* quoting needed for + and ? */
+#define RE_TIGHT_VBAR		8    /* | binds tighter than ^ and $ */
+#define RE_NEWLINE_OR		16   /* treat newline as or */
+#define RE_CONTEXT_INDEP_OPS	32   /* ^$?*+ are special in all contexts */
+#define RE_ANSI_HEX		64   /* ansi sequences (\n etc) and \xhh */
+#define RE_NO_GNU_EXTENSIONS   128   /* no gnu extensions */
+
+#define TP_RE_NOERR             0
+#define TP_RE_UNKNOWN_OPCODE    (-1)
+#define TP_RE_JUMP_OUT_BOUNDS   1
+#define TP_RE_QUOTE_ERR         2
+
+/* definitions for some common regexp styles */
+#define RE_SYNTAX_AWK	(RE_NO_BK_PARENS|RE_NO_BK_VBAR|RE_CONTEXT_INDEP_OPS)
+#define RE_SYNTAX_EGREP	(RE_SYNTAX_AWK|RE_NEWLINE_OR)
+#define RE_SYNTAX_GREP	(RE_BK_PLUS_QM|RE_NEWLINE_OR)
+#define RE_SYNTAX_EMACS	0
+
+#define Sword       1
+#define Swhitespace 2
+#define Sdigit      4
+#define Soctaldigit 8
+#define Shexdigit   16
+
+/* Rename all exported symbols to avoid conflicts with similarly named
+   symbols in some systems' standard C libraries... */
+
+#define re_syntax _Py_re_syntax
+#define re_syntax_table _Py_re_syntax_table
+#define re_compile_initialize _Py_re_compile_initialize
+#define re_set_syntax _Py_re_set_syntax
+#define re_compile_pattern _Py_re_compile_pattern
+#define re_match _Py_re_match
+#define re_search _Py_re_search
+#define re_compile_fastmap _Py_re_compile_fastmap
+#define re_comp _Py_re_comp
+#define re_exec _Py_re_exec
+
+#ifdef HAVE_PROTOTYPES
+
+extern int re_syntax;
+/* This is the actual syntax mask.  It was added so that Python could do
+ * syntax-dependent munging of patterns before compilation. */
+
+extern unsigned char re_syntax_table[256];
+
+void re_compile_initialize(void);
+
+int re_set_syntax(int syntax);
+/* This sets the syntax to use and returns the previous syntax.  The
+ * syntax is specified by a bit mask of the above defined bits. */
+
+char *re_compile_pattern(unsigned char *regex, int regex_size, regexp_t compiled);
+/* This compiles the regexp (given in regex and length in regex_size).
+ * This returns NULL if the regexp compiled successfully, and an error
+ * message if an error was encountered.  The buffer field must be
+ * initialized to a memory area allocated by malloc (or to NULL) before
+ * use, and the allocated field must be set to its length (or 0 if
+ * buffer is NULL).  Also, the translate field must be set to point to a
+ * valid translation table, or NULL if it is not used. */
+
+int re_match(regexp_t compiled, unsigned char *string, int size, int pos,
+	     regexp_registers_t old_regs);
+/* This tries to match the regexp against the string.  This returns the
+ * length of the matched portion, or -1 if the pattern could not be
+ * matched and -2 if an error (such as failure stack overflow) is
+ * encountered. */
+
+int re_search(regexp_t compiled, unsigned char *string, int size, int startpos,
+	      int range, regexp_registers_t regs);
+/* This searches for a substring matching the regexp.  This returns the
+ * first index at which a match is found.  range specifies at how many
+ * positions to try matching; positive values indicate searching
+ * forwards, and negative values indicate searching backwards.  (The
+ * original text also describes an mstop argument, the offset beyond
+ * which a match must not go; the prototype above has no such
+ * parameter.)  This returns -1 if no match is found, and -2 if an error
+ * (such as failure stack overflow) is encountered. */
+
+void re_compile_fastmap(regexp_t compiled);
+/* This computes the fastmap for the regexp.  For this to have any effect,
+ * the calling program must have initialized the fastmap field to point
+ * to an array of 256 characters. */
+
+#else /* HAVE_PROTOTYPES */
+
+extern int re_syntax;
+extern unsigned char re_syntax_table[256];
+void re_compile_initialize();
+int re_set_syntax();
+char *re_compile_pattern();
+int re_match();
+int re_search();
+void re_compile_fastmap();
+
+#endif /* HAVE_PROTOTYPES */
+
+#endif /* REGEXPR_H */
+
+
+
+#ifdef __cplusplus
+}
+#endif
+#endif /* !Py_REGEXPR_H */
--- a/programs/develop/tinypy/modules/re/tests.py
+++ b/programs/develop/tinypy/modules/re/tests.py
@ -0,0 +1,648 @@
+"""
+test case for re module
+"""
+
+import re
+import testsuite
+# expected-outcome codes stored in field 2 of every test case:
+# SUCCEED == 0, FAIL == 1, SYNTAX_ERROR == 2
+SUCCEED, FAIL, SYNTAX_ERROR = range(3)
+
+def RAISE():
+    raise("testing failed")
+
+def main():
+    #print("begin re tests")
+
+    assert(re.__name__ != None)
+    assert(re.__doc__ != None)
+    assert(re.__file__ != None)
+
+    test_re_obj_search()
+    test_re_obj_match()
+    test_re_mod_search()
+    test_re_mod_match()
+    test_re_obj_split()
+    test_re_mod_split()
+    test_re_obj_findall()
+    test_re_mod_findall()
+    test_mat_obj_groups()
+    test_mat_obj_start()
+    test_mat_obj_end()
+    test_mat_obj_span()
+
+    print("#OK: re tests passed")
+
+def test_re_obj_search(verbose = None):
+    """
+    some tests borrowed from cpython
+    testing re.compile(), reobj.search(), and matobj.group()
+    """
+    regex_tests = testsuite.search_regex_tests
+    for t in regex_tests:
+        pattern=s=outcome=repl=expected=None
+        if len(t)==5:
+            pattern, s, outcome, repl, expected = t
+        elif len(t)==3:
+            pattern, s, outcome = t
+        else:
+            raise ('Test tuples should have 3 or 5 fields',t)
+
+        try:
+            obj=re.compile(pattern)
+        except:
+            if outcome==SYNTAX_ERROR: continue    # Expected a syntax error
+            else:
+                # Regex syntax errors aren't yet reported, so for
+                # the official test suite they'll be quietly ignored.
+                pass
+        try:
+            matobj=obj.search(s)
+        except:
+            print('=== Unexpected exception:', obj, matobj, pattern, s)
+            RAISE()
+
+        if outcome==SYNTAX_ERROR:
+            # This should have been a syntax error; forget it.
+            pass
+        elif outcome==FAIL:
+            if matobj==None: pass   # No match, as expected
+            else: print('=== Succeeded incorrectly', obj, matobj, pattern, s)
+        elif outcome==SUCCEED:
+            if matobj!=None:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                found=matobj.group(0)
+                repl = repl.replace("found", str(found))
+                for i in range(1,11):
+                    if "g"+str(i) in repl:
+                        gi = str(matobj.group(i))
+                        repl = repl.replace("g"+str(i), gi)
+                if len(t) == 5:
+                    repl = repl.replace('+', '')
+                    repl = repl.replace('\"', '')
+                    if repl!=expected:
+                        print( '=== grouping error', t, 
+                                str(repl)+' should be '+str(expected))
+                        RAISE()
+            else:
+                print ('=== Failed incorrectly', t)
+
+def test_re_obj_match(verbose = None):
+    """
+    some tests borrowed from cpython
+    testing re.compile(), reobj.match() and matobj.group()
+    """
+    regex_tests = testsuite.match_regex_tests
+    for t in regex_tests:
+        pattern=s=outcome=repl=expected=None
+        if len(t)==5:
+            pattern, s, outcome, repl, expected = t
+        elif len(t)==3:
+            pattern, s, outcome = t
+        else:
+            raise ('Test tuples should have 3 or 5 fields',t)
+
+        try:
+            obj=re.compile(pattern)
+        except:
+            if outcome==SYNTAX_ERROR: continue    # Expected a syntax error
+            else:
+                # Regex syntax errors aren't yet reported, so for
+                # the official test suite they'll be quietly ignored.
+                pass
+        try:
+            matobj=obj.match(s)
+        except:
+            print('=== Unexpected exception:', obj, matobj, pattern, s)
+
+        if outcome==SYNTAX_ERROR:
+            # This should have been a syntax error; forget it.
+            pass
+        elif outcome==FAIL:
+            if matobj==None: pass   # No match, as expected
+            else: print('=== Succeeded incorrectly', obj, matobj, pattern, s)
+        elif outcome==SUCCEED:
+            if matobj!=None:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                found=matobj.group(0)
+                repl = repl.replace("found", str(found))
+                for i in range(1,11):
+                    if "g"+str(i) in repl:
+                        gi = str(matobj.group(i))
+                        repl = repl.replace("g"+str(i), gi)
+                if len(t) == 5:
+                    repl = repl.replace('+', '')
+                    repl = repl.replace('\"', '')
+                    if repl!=expected:
+                        print( '=== grouping error', t, 
+                                str(repl)+' should be '+str(expected))
+                        RAISE()
+            else:
+                print ('=== Failed incorrectly', obj, matobj, pattern, s)
+
+def test_re_mod_search(verbose = None):
+    """
+    some tests borrowed from cpython
+    testing re.search(), and matobj.group()
+    """
+    regex_tests = testsuite.search_regex_tests
+    for t in regex_tests:
+        pattern=s=outcome=repl=expected=None
+        if len(t)==5:
+            pattern, s, outcome, repl, expected = t
+        elif len(t)==3:
+            pattern, s, outcome = t
+        else:
+            raise ('Test tuples should have 3 or 5 fields',t)
+
+        try:
+            matobj=re.search(pattern, s)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                pass
+            else:
+                print('=== Unexpected exception:', matobj, pattern, s)
+
+        if outcome==FAIL:
+            if matobj==None: pass   # No match, as expected
+            else: print('=== Succeeded incorrectly', obj, matobj, pattern, s)
+        elif outcome==SUCCEED:
+            if matobj!=None:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                found=matobj.group(0)
+                repl = repl.replace("found", str(found))
+                for i in range(1,11):
+                    if "g"+str(i) in repl:
+                        gi = str(matobj.group(i))
+                        repl = repl.replace("g"+str(i), gi)
+                if len(t) == 5:
+                    repl = repl.replace('+', '')
+                    repl = repl.replace('\"', '')
+                    if repl!=expected:
+                        print( '=== grouping error', t, 
+                                str(repl)+' should be '+str(expected))
+                        RAISE()
+            else:
+                print ('=== Failed incorrectly', t)
+
+def test_re_mod_match(verbose = None):
+    """
+    some tests borrowed from cpython
+    testing re.match(), and matobj.group()
+    """
+    regex_tests = testsuite.match_regex_tests
+    for t in regex_tests:
+        pattern=s=outcome=repl=expected=None
+        if len(t)==5:
+            pattern, s, outcome, repl, expected = t
+        elif len(t)==3:
+            pattern, s, outcome = t
+        else:
+            raise ('Test tuples should have 3 or 5 fields',t)
+
+        try:
+            matobj=re.match(pattern, s)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                pass
+            else:
+                print('=== Unexpected exception:', matobj, pattern, s)
+
+        if outcome==FAIL:
+            if matobj==None: pass   # No match, as expected
+            else: print('=== Succeeded incorrectly', matobj, pattern, s)
+        elif outcome==SUCCEED:
+            if matobj!=None:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                found=matobj.group(0)
+                repl = repl.replace("found", str(found))
+                for i in range(1,11):
+                    if "g"+str(i) in repl:
+                        gi = str(matobj.group(i))
+                        repl = repl.replace("g"+str(i), gi)
+                if len(t) == 5:
+                    repl = repl.replace('+', '')
+                    repl = repl.replace('\"', '')
+                    if repl!=expected:
+                        print( '=== grouping error', t, 
+                                str(repl)+' should be '+str(expected))
+                        RAISE()
+            else:
+                print ('=== Failed incorrectly', t)
+
+def test_re_obj_split(verbose = None):
+    """
+    test re.compile(), and reobj.split()
+    """
+    regex_tests = testsuite.split_regex_tests
+    for t in regex_tests:
+        pattern, s, outcome, maxsplit, fields = t
+        try:
+            reobj = re.compile(pattern)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                pass
+            else:
+                print('=== Unexpected exception:', pattern, s, 
+                                    outcome, maxsplit, fields)
+        try:
+            fldlst=reobj.split(s, maxsplit)
+        except:
+            if outcome == SYNTAX_ERROR:
+                continue
+            else:
+                print('=== Unexpected exception:', pattern, s, 
+                                    outcome, maxsplit, fields)
+
+        if outcome==FAIL:
+            pass    # No match, as expected
+        elif outcome==SUCCEED:
+            if fldlst:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                if verbose:
+                    fldstr = fieldstr = ""
+                    for item in fldlst:
+                        fldstr = fldstr + str(item) + " | "
+                    for item in fields:
+                        fieldstr = fieldstr + str(item) + " | "
+                    print(fldstr, "~~~", fieldstr)
+                if len(fields) != len(fldlst):
+                    print('=== Not coherent 1')
+                    RAISE()
+
+                for i in range(len(fields)):
+                    if fields[i] != fldlst[i]:
+                        if verbose:
+                            print('=== Not coherent 2', pattern, s, 
+                                    outcome, maxsplit, fields, i, 
+                                    fields[i],'(',len(fields[i]),')', ' | ', 
+                                    fldlst[i],'(',len(fldlst[i]),')')
+                        else:
+                            print('=== Not coherent 2')
+                        RAISE()
+            else:
+                print ('=== Failed incorrectly', pattern, s, 
+                        outcome, maxsplit, fields)
+
+def test_re_mod_split(verbose = None):
+    """
+    test re.split()
+    """
+    regex_tests = testsuite.split_regex_tests
+    for t in regex_tests:
+        pattern, s, outcome, maxsplit, fields = t
+        try:
+            fldlst=re.split(pattern, s, maxsplit)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception:', pattern, s, 
+                                    outcome, maxsplit, fields)
+
+        if outcome==FAIL:
+            pass    # No match, as expected
+        elif outcome==SUCCEED:
+            if fldlst:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                if verbose:
+                    fldstr = fieldstr = ""
+                    for item in fldlst:
+                        fldstr = fldstr + str(item) + " | "
+                    for item in fields:
+                        fieldstr = fieldstr + str(item) + " | "
+                    print(fldstr, "~~~", fieldstr)
+
+                if len(fields) != len(fldlst):
+                    print('=== Not coherent 1')
+                    RAISE()
+
+                for i in range(len(fields)):
+                    if fields[i] != fldlst[i]:
+                        if verbose:
+                            print('=== Not coherent 2', pattern, s, 
+                                    outcome, maxsplit, fields, i, 
+                                    fields[i],'(',len(fields[i]),')', ' | ', 
+                                    fldlst[i],'(',len(fldlst[i]),')')
+                        else:
+                            print('=== Not coherent 2')
+                        RAISE()
+            else:
+                print ('=== Failed incorrectly', pattern, s, 
+                        outcome, maxsplit, fields)
+
+def test_re_obj_findall(verbose = None):
+    """
+    test re.compile(), and reobj.findall()
+    """
+    regex_tests = testsuite.findall_regex_tests
+    for t in regex_tests:
+        pattern, s, outcome, pos, fields = t
+        try:
+            reobj = re.compile(pattern)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                pass
+            else:
+                print('=== Unexpected exception:', pattern, s, 
+                                    outcome, pos, fields)
+        try:
+            fldlst=reobj.findall(s, pos)
+        except:
+            if outcome == SYNTAX_ERROR:
+                continue
+            else:
+                print('=== Unexpected exception:', pattern, s, 
+                                    outcome, pos, fields)
+
+        if outcome==FAIL:
+            pass    # No match, as expected
+        elif outcome==SUCCEED:
+            if fldlst:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                if verbose:
+                    fldstr = fieldstr = ""
+                    for item in fldlst:
+                        fldstr = fldstr + str(item) + " | "
+                    for item in fields:
+                        fieldstr = fieldstr + str(item) + " | "
+                    print(fldstr, "~~~", fieldstr)
+
+                if len(fields) != len(fldlst):
+                    print('=== Not coherent 1')
+                    RAISE()
+
+                for i in range(len(fields)):
+                    if fields[i] != fldlst[i]:
+                        if verbose:
+                            print('=== Not coherent 2', pattern, s, 
+                                    outcome, maxsplit, fields, i, 
+                                    fields[i],'(',len(fields[i]),')', ' | ', 
+                                    fldlst[i],'(',len(fldlst[i]),')')
+                        else:
+                            print('=== Not coherent 2')
+                        RAISE()
+            else:
+                print ('=== Failed incorrectly', pattern, s, 
+                        outcome, pos, fields)
+
+def test_re_mod_findall(verbose = None):
+    """
+    test re.findall()
+    """
+    regex_tests = testsuite.mod_findall_regex_tests
+    for t in regex_tests:
+        pattern, s, outcome, pos, fields = t    # pos is not used
+        try:
+            fldlst=re.findall(pattern, s)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception:', pattern, s, 
+                                    outcome, pos, fields)
+
+        if outcome==FAIL:
+            pass    # No match, as expected
+        elif outcome==SUCCEED:
+            if fldlst:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                if verbose:
+                    fldstr = fieldstr = ""
+                    for item in fldlst:
+                        fldstr = fldstr + str(item) + " | "
+                    for item in fields:
+                        fieldstr = fieldstr + str(item) + " | "
+                    print(fldstr, "~~~", fieldstr)
+
+                if len(fields) != len(fldlst):
+                    print('=== Not coherent 1')
+                    RAISE()
+
+                for i in range(len(fields)):
+                    if fields[i] != fldlst[i]:
+                        if verbose:
+                            print('=== Not coherent 2', pattern, s, 
+                                    outcome, maxsplit, fields, i, 
+                                    fields[i],'(',len(fields[i]),')', ' | ', 
+                                    fldlst[i],'(',len(fldlst[i]),')')
+                        else:
+                            print('=== Not coherent 2')
+                        RAISE()
+            else:
+                print ('=== Failed incorrectly', pattern, s, 
+                        outcome, pos, fields)
+
+def test_mat_obj_groups(verbose = None):
+    """
+    test re.search(), and matobj.groups()
+    'verbose' is for debugging, when 'verbose' is true, print extra info
+    """
+    regex_tests = testsuite.matobj_groups_regex_tests
+    for t in regex_tests:
+        pattern, s, outcome, fields, grpidx, start, end = t
+        try:
+            matobj=re.search(pattern, s)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception 1:', pattern, s, 
+                                    outcome,fields)
+
+        try:
+            if outcome==SUCCEED: assert(matobj != None)
+            fldlst = matobj.groups()
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception 2:', pattern, s, 
+                                    outcome,fields)
+           
+        if outcome==FAIL:
+            pass    # No match, as expected
+        elif outcome==SUCCEED:
+            if fldlst and fields:
+                # Matched, as expected, so now we compute the
+                # result string and compare it to our expected result.
+                if verbose:
+                    fldstr = fieldstr = ""
+                    for item in fldlst:
+                        fldstr = fldstr + str(item) + " | "
+                    for item in fields:
+                        fieldstr = fieldstr + str(item) + " | "
+                    print(fldstr, "~~~", fieldstr)
+
+                if len(fields) != len(fldlst):
+                    print('=== Not coherent 2')
+                    RAISE()
+
+                for i in range(len(fields)):
+                    if fields[i] != fldlst[i]:
+                        if verbose:
+                            print('=== Not coherent', pattern, s, 
+                                    outcome,fields, i, 
+                                    fields[i],'(',len(fields[i]),')', ' | ', 
+                                    fldlst[i],'(',len(fldlst[i]),')')
+                        else:
+                            print('=== Not coherent')
+                        RAISE()
+            elif not len(fldlst) and not len(fields):
+                # output is empty, as expected
+                if verbose:
+                    print("output is empty, as expected")
+                continue
+            else:
+                if verbose:
+                    for item in fldlst:
+                        print(item,)
+                    print()
+                    for item in fields: 
+                        print(item,)
+                    print()
+                print ('=== Failed incorrectly', pattern, s, 
+                        outcome,fields,fldlst)
+
+def test_mat_obj_start(verbose = None):
+    """
+    test re.search(), and matobj.start()
+    'verbose' is for debugging, when 'verbose' is true, print extra info
+    """
+    regex_tests = testsuite.matobj_groups_regex_tests
+    for t in regex_tests:
+        pattern, s, outcome, fields, grpidx, start, end = t
+        try:
+            matobj=re.search(pattern, s)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception 1:', pattern, s, 
+                                    outcome,fields)
+
+        try:
+            if outcome==SUCCEED: assert(matobj != None)
+            fldlst = matobj.groups()
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception 2:', pattern, s, 
+                                    outcome,fields)
+           
+        if outcome==FAIL:
+            pass    # No match, as expected
+        elif outcome==SUCCEED:
+            if grpidx > 0:
+                if matobj.start(grpidx) == start:
+                    pass
+                else:
+                    if verbose:
+                        print ('=== Failed incorrectly', pattern, s, 
+                            outcome,fields,fldlst)
+                    raise("testing failed")
+
+
+def test_mat_obj_end(verbose = None):
+    """
+    test re.search(), and matobj.end()
+    'verbose' is for debugging, when 'verbose' is true, print extra info
+    """
+    regex_tests = testsuite.matobj_groups_regex_tests
+    for t in regex_tests:
+        pattern, s, outcome, fields, grpidx, start, end = t
+        try:
+            matobj=re.search(pattern, s)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception 1:', pattern, s, 
+                                    outcome,fields)
+
+        try:
+            if outcome==SUCCEED: assert(matobj != None)
+            fldlst = matobj.groups()
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception 2:', pattern, s, 
+                                    outcome,fields)
+           
+        if outcome==FAIL:
+            pass    # No match, as expected
+        elif outcome==SUCCEED:
+            if grpidx > 0:
+                if matobj.end(grpidx) == end:
+                    pass
+                else:
+                    if verbose:
+                        print ('=== Failed incorrectly', pattern, s, 
+                            outcome,fields,fldlst, matobj.end(grpidx), end)
+                    raise("testing failed")
+
+def test_mat_obj_span(verbose = None):
+    """
+    test re.search(), and matobj.span()
+    'verbose' is for debugging, when 'verbose' is true, print extra info
+    """
+    regex_tests = testsuite.matobj_groups_regex_tests
+    for t in regex_tests:
+        pattern, s, outcome, fields, grpidx, start, end = t
+        try:
+            matobj=re.search(pattern, s)
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception 1:', pattern, s, 
+                                    outcome,fields)
+
+        try:
+            if outcome==SUCCEED: assert(matobj != None)
+            fldlst = matobj.groups()
+        except:
+            if outcome==SYNTAX_ERROR:
+                # This should have been a syntax error; forget it.
+                continue
+            else:
+                print('=== Unexpected exception 2:', pattern, s, 
+                                    outcome,fields)
+           
+        if outcome==FAIL:
+            pass    # No match, as expected
+        elif outcome==SUCCEED:
+            if (grpidx > 0):
+                spstart, spend = matobj.span(grpidx)
+                if spstart == start and spend == end:
+                    pass
+                else:
+                    if verbose:
+                        print ('=== Failed incorrectly', pattern, s, 
+                            outcome,fields,fldlst)
+                    raise("testing failed")
+
+# run the whole suite when this file is executed as a script
+if __name__ == "__main__":
+	main()
+
--- a/programs/develop/tinypy/modules/re/testsuite.py
+++ b/programs/develop/tinypy/modules/re/testsuite.py
@ -0,0 +1,367 @@
+# Test suite (for verifying correctness)
+#
+# The test suite is a list of 5- or 3-element lists.  The 5 parts of a
+# complete entry are:
+# element 0: a string containing the pattern
+#         1: the string to match against the pattern
+#         2: the expected result (0 - SUCCEED, 1 - FAIL, 2 - SYNTAX_ERROR)
+#         3: a string that will be eval()'ed to produce a test string.
+#            This is an arbitrary Python expression; the available
+#            variables are "found" (the whole match), and "g1", "g2", ...
+#            up to "g10" contain the contents of each group, or the
+#            string 'None' if the group wasn't given a value.
+#         4: The expected result of evaluating the expression.
+#            If the two don't match, an error is reported.
+#
+# If the regex isn't expected to work, the latter two elements can be omitted.
+
+# test suite for search: the pattern may match at any position in the
+# string (e.g. 'abc' is found inside 'xabcy')
+search_regex_tests=[
+['abc', 'abc', 0, 'found', 'abc'],
+['abc', 'xbc', 1],
+['abc', 'axc', 1],
+['abc', 'abx', 1],
+['abc', 'xabcy', 0, 'found', 'abc'],
+['abc', 'ababc', 0, 'found', 'abc'],
+['ab*c', 'abc', 0, 'found', 'abc'],
+['ab*bc', 'abc', 0, 'found', 'abc'],
+['ab*bc', 'abbc', 0, 'found', 'abbc'],
+['ab*bc', 'abbbbc', 0, 'found', 'abbbbc'],
+['ab+bc', 'abbc', 0, 'found', 'abbc'],
+['ab+bc', 'abc', 1],
+['ab+bc', 'abq', 1],
+['ab+bc', 'abbbbc', 0, 'found', 'abbbbc'],
+['ab?bc', 'abbc', 0, 'found', 'abbc'],
+['ab?bc', 'abc', 0, 'found', 'abc'],
+['ab?bc', 'abbbbc', 1],
+['ab?c', 'abc', 0, 'found', 'abc'],
+['^abc$', 'abc', 0, 'found', 'abc'],
+['^abc$', 'abcc', 1],
+['^abc', 'abcc', 0, 'found', 'abc'],
+['^abc$', 'aabc', 1],
+['abc$', 'aabc', 0, 'found', 'abc'],
+['^', 'abc', 0, 'found+"-"', '-'],
+['$', 'abc', 0, 'found+"-"', '-'],
+['a.c', 'abc', 0, 'found', 'abc'],
+['a.c', 'axc', 0, 'found', 'axc'],
+['a.*c', 'axyzc', 0, 'found', 'axyzc'],
+['a.*c', 'axyzd', 1],
+['a[bc]d', 'abc', 1],
+['a[bc]d', 'abd', 0, 'found', 'abd'],
+['a[b-d]e', 'abd', 1],
+['a[b-d]e', 'ace', 0, 'found', 'ace'],
+['a[b-d]', 'aac', 0, 'found', 'ac'],
+['a[-b]', 'a-', 0, 'found', 'a-'],
+['a[b-]', 'a-', 0, 'found', 'a-'],
+['a[]b', '-', 2],
+['a[', '-', 2],
+['a\\', '-', 2],
+['abc\\)', '-', 2],
+['\\(abc', '-', 2],
+['a]', 'a]', 0, 'found', 'a]'],
+['a[]]b', 'a]b', 0, 'found', 'a]b'],
+['a[^bc]d', 'aed', 0, 'found', 'aed'],
+['a[^bc]d', 'abd', 1],
+['a[^-b]c', 'adc', 0, 'found', 'adc'],
+['a[^-b]c', 'a-c', 1],
+['a[^]b]c', 'a]c', 1],
+['a[^]b]c', 'adc', 0, 'found', 'adc'],
+['\\ba\\b', 'a-', 0, '"-"', '-'],
+['\\ba\\b', '-a', 0, '"-"', '-'],
+['\\ba\\b', '-a-', 0, '"-"', '-'],
+['\\by\\b', 'xy', 1],
+['\\by\\b', 'yz', 1],
+['\\by\\b', 'xyz', 1],
+['ab\\|cd', 'abc', 0, 'found', 'ab'],
+['ab\\|cd', 'abcd', 0, 'found', 'ab'],
+['\\(\\)ef', 'def', 0, 'found+"-"+g1', 'ef-'],
+['$b', 'b', 1],
+['a(b', 'a(b', 0, 'found+"-"+g1', 'a(b-None'],
+['a(*b', 'ab', 0, 'found', 'ab'],
+['a(*b', 'a((b', 0, 'found', 'a((b'],
+['a\\\\b', 'a\\b', 0, 'found', 'a\\b'],
+['\\(\\(a\\)\\)', 'abc', 0, 'found+"-"+g1+"-"+g2', 'a-a-a'],
+['\\(a\\)b\\(c\\)', 'abc', 0, 'found+"-"+g1+"-"+g2', 'abc-a-c'],
+['a+b+c', 'aabbabc', 0, 'found', 'abc'],
+['\\(a+\\|b\\)*', 'ab', 0, 'found+"-"+g1', 'ab-b'],
+['\\(a+\\|b\\)+', 'ab', 0, 'found+"-"+g1', 'ab-b'],
+['\\(a+\\|b\\)?', 'ab', 0, 'found+"-"+g1', 'a-a'],
+['\\)\\(', '-', 2],
+['[^ab]*', 'cde', 0, 'found', 'cde'],
+['abc', '', 1],
+['a*', '', 0, 'found', ''],
+['a\\|b\\|c\\|d\\|e', 'e', 0, 'found', 'e'],
+['\\(a\\|b\\|c\\|d\\|e\\)f', 'ef', 0, 'found+"-"+g1', 'ef-e'],
+['abcd*efg', 'abcdefg', 0, 'found', 'abcdefg'],
+['ab*', 'xabyabbbz', 0, 'found', 'ab'],
+['ab*', 'xayabbbz', 0, 'found', 'a'],
+['\\(ab\\|cd\\)e', 'abcde', 0, 'found+"-"+g1', 'cde-cd'],
+['[abhgefdc]ij', 'hij', 0, 'found', 'hij'],
+['^\\(ab\\|cd\\)e', 'abcde', 1, 'xg1y', 'xy'],
+['\\(abc\\|\\)ef', 'abcdef', 0, 'found+"-"+g1', 'ef-'],
+['\\(a\\|b\\)c*d', 'abcd', 0, 'found+"-"+g1', 'bcd-b'],
+['\\(ab\\|ab*\\)bc', 'abc', 0, 'found+"-"+g1', 'abc-a'],
+['a\\([bc]*\\)c*', 'abc', 0, 'found+"-"+g1', 'abc-bc'],
+['a\\([bc]*\\)\\(c*d\\)', 'abcd', 0, 'found+"-"+g1+"-"+g2', 'abcd-bc-d'],
+['a\\([bc]+\\)\\(c*d\\)', 'abcd', 0, 'found+"-"+g1+"-"+g2', 'abcd-bc-d'],
+['a\\([bc]*\\)\\(c+d\\)', 'abcd', 0, 'found+"-"+g1+"-"+g2', 'abcd-b-cd'],
+['a[bcd]*dcdcde', 'adcdcde', 0, 'found', 'adcdcde'],
+['a[bcd]+dcdcde', 'adcdcde', 1],
+['\\(ab\\|a\\)b*c', 'abc', 0, 'found+"-"+g1', 'abc-ab'],
+['\\(\\(a\\)\\(b\\)c\\)\\(d\\)', 'abcd', 0, 'g1+"-"+g2+"-"+g3+"-"+g4', 'abc-a-b-d'],
+['[a-zA-Z_][a-zA-Z0-9_]*', 'alpha', 0, 'found', 'alpha'],
+['^a\\(bc+\\|b[eh]\\)g\\|.h$', 'abh', 0, 'found+"-"+g1', 'bh-None'],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'effgz', 0, 'found+"-"+g1+"-"+g2', 'effgz-effgz-None'],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'ij', 0, 'found+"-"+g1+"-"+g2', 'ij-ij-j'],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'effg', 1],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'bcdd', 1],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'reffgz', 0, 'found+"-"+g1+"-"+g2', 'effgz-effgz-None'],
+['\\(\\(\\(\\(\\(\\(\\(\\(\\(a\\)\\)\\)\\)\\)\\)\\)\\)\\)', 'a', 0, 'found', 'a'],
+['multiple words of text', 'uh-uh', 1],
+['multiple words', 'multiple words, yeah', 0, 'found', 'multiple words'],
+['\\(.*\\)c\\(.*\\)', 'abcde', 0, 'found+"-"+g1+"-"+g2', 'abcde-ab-de'],
+['(\\(.*\\), \\(.*\\))', '(a, b)', 0, 'g2+"-"+g1', 'b-a'],
+['[k]', 'ab', 1],
+['a[-]?c', 'ac', 0, 'found', 'ac'],
+['\\(abc\\)\\1', 'abcabc', 0, 'g1', 'abc'],
+['\\([a-c]*\\)\\1', 'abcabc', 0, 'g1', 'abc'],
+['^\\(.+\\)?B', 'AB', 0, 'g1', 'A'],
+['\\(a+\\).\\1$', 'aaaaa', 0, 'found+"-"+g1', 'aaaaa-aa'],
+['^\\(a+\\).\\1$', 'aaaa', 1],
+['\\(abc\\)\\1', 'abcabc', 0, 'found+"-"+g1', 'abcabc-abc'],
+['\\([a-c]+\\)\\1', 'abcabc', 0, 'found+"-"+g1', 'abcabc-abc'],
+['\\(a\\)\\1', 'aa', 0, 'found+"-"+g1', 'aa-a'],
+['\\(a+\\)\\1', 'aa', 0, 'found+"-"+g1', 'aa-a'],
+['\\(a+\\)+\\1', 'aa', 0, 'found+"-"+g1', 'aa-a'],
+['\\(a\\).+\\1', 'aba', 0, 'found+"-"+g1', 'aba-a'],
+['\\(a\\)ba*\\1', 'aba', 0, 'found+"-"+g1', 'aba-a'],
+['\\(aa\\|a\\)a\\1$', 'aaa', 0, 'found+"-"+g1', 'aaa-a'],
+['\\(a\\|aa\\)a\\1$', 'aaa', 0, 'found+"-"+g1', 'aaa-a'],
+['\\(a+\\)a\\1$', 'aaa', 0, 'found+"-"+g1', 'aaa-a'],
+['\\([abc]*\\)\\1', 'abcabc', 0, 'found+"-"+g1', 'abcabc-abc'],
+['\\(a\\)\\(b\\)c\\|ab', 'ab', 0, 'found+"-"+g1+"-"+g2', 'ab-None-None'],
+['\\(a\\)+x', 'aaax', 0, 'found+"-"+g1', 'aaax-a'],
+['\\([ac]\\)+x', 'aacx', 0, 'found+"-"+g1', 'aacx-c'],
+['\\([^/]*/\\)*sub1/', 'd:msgs/tdir/sub1/trial/away.cpp', 0, 'found+"-"+g1', 'd:msgs/tdir/sub1/-tdir/'],
+['\\([^.]*\\)\\.\\([^:]*\\):[T ]+\\(.*\\)', 'track1.title:TBlah blah blah', 0, 'found+"-"+g1+"-"+g2+"-"+g3', 'track1.title:TBlah blah blah-track1-title-Blah blah blah'],
+['\\([^N]*N\\)+', 'abNNxyzN', 0, 'found+"-"+g1', 'abNNxyzN-xyzN'],
+['\\([^N]*N\\)+', 'abNNxyz', 0, 'found+"-"+g1', 'abNN-N'],
+['\\([abc]*\\)x', 'abcx', 0, 'found+"-"+g1', 'abcx-abc'],
+['\\([abc]*\\)x', 'abc', 1],
+['\\([xyz]*\\)x', 'abcx', 0, 'found+"-"+g1', 'x-'],
+['\\(a\\)+b\\|aac', 'aac', 0, 'found+"-"+g1', 'aac-None'],
+['\\<a', 'a', 0, 'found', 'a'],
+['\\<a', '!', 1],
+['a\\<b', 'ab', 1],
+['a\\>', 'ab', 1],
+['a\\>', 'a!', 0, 'found', 'a'],
+['a\\>', 'a', 0, 'found', 'a'],
+]
+
+
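+# test suite for match: the pattern has to match at the start of the
+# string (e.g. 'abc' against 'xabcy' is expected to FAIL)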
+match_regex_tests=[
+['abc', 'abc', 0, 'found', 'abc'],
+['abc', 'xbc', 1],
+['abc', 'axc', 1],
+['abc', 'abx', 1],
+['abc', 'xabcy', 1],
+['abc', 'ababc', 1],
+['ab*c', 'abc', 0, 'found', 'abc'],
+['ab*bc', 'abc', 0, 'found', 'abc'],
+['ab*bc', 'abbc', 0, 'found', 'abbc'],
+['ab*bc', 'abbbbc', 0, 'found', 'abbbbc'],
+['ab+bc', 'abbc', 0, 'found', 'abbc'],
+['ab+bc', 'abc', 1],
+['ab+bc', 'abq', 1],
+['ab+bc', 'abbbbc', 0, 'found', 'abbbbc'],
+['ab?bc', 'abbc', 0, 'found', 'abbc'],
+['ab?bc', 'abc', 0, 'found', 'abc'],
+['ab?bc', 'abbbbc', 1],
+['ab?c', 'abc', 0, 'found', 'abc'],
+['^abc$', 'abc', 0, 'found', 'abc'],
+['^abc$', 'abcc', 1],
+['^abc', 'abcc', 0, 'found', 'abc'],
+['^abc$', 'aabc', 1],
+['abc$', 'aabc', 1],
+['^', 'abc', 0, 'found+"-"', '-'],
+['$', 'abc', 1],
+['a.c', 'abc', 0, 'found', 'abc'],
+['a.c', 'axc', 0, 'found', 'axc'],
+['a.*c', 'axyzc', 0, 'found', 'axyzc'],
+['a.*c', 'axyzd', 1],
+['a[bc]d', 'abc', 1],
+['a[bc]d', 'abd', 0, 'found', 'abd'],
+['a[b-d]e', 'abd', 1],
+['a[b-d]e', 'ace', 0, 'found', 'ace'],
+['a[b-d]', 'aac', 1],
+['a[-b]', 'a-', 0, 'found', 'a-'],
+['a[b-]', 'a-', 0, 'found', 'a-'],
+['a[]b', '-', 2],
+['a[', '-', 2],
+['a\\', '-', 2],
+['abc\\)', '-', 2],
+['\\(abc', '-', 2],
+['a]', 'a]', 0, 'found', 'a]'],
+['a[]]b', 'a]b', 0, 'found', 'a]b'],
+['a[^bc]d', 'aed', 0, 'found', 'aed'],
+['a[^bc]d', 'abd', 1],
+['a[^-b]c', 'adc', 0, 'found', 'adc'],
+['a[^-b]c', 'a-c', 1],
+['a[^]b]c', 'a]c', 1],
+['a[^]b]c', 'adc', 0, 'found', 'adc'],
+['\\ba\\b', 'a-', 0, '"-"', '-'],
+['\\ba\\b', '-a', 1],
+['\\ba\\b', '-a-', 1],
+['\\by\\b', 'xy', 1],
+['\\by\\b', 'yz', 1],
+['\\by\\b', 'xyz', 1],
+['ab\\|cd', 'abc', 0, 'found', 'ab'],
+['ab\\|cd', 'abcd', 0, 'found', 'ab'],
+['\\(\\)ef', 'def', 1],
+['$b', 'b', 1],
+['a(b', 'a(b', 0, 'found+"-"+g1', 'a(b-None'],
+['a(*b', 'ab', 0, 'found', 'ab'],
+['a(*b', 'a((b', 0, 'found', 'a((b'],
+['a\\\\b', 'a\\b', 0, 'found', 'a\\b'],
+['\\(\\(a\\)\\)', 'abc', 0, 'found+"-"+g1+"-"+g2', 'a-a-a'],
+['\\(a\\)b\\(c\\)', 'abc', 0, 'found+"-"+g1+"-"+g2', 'abc-a-c'],
+['a+b+c', 'aabbabc', 1],
+['\\(a+\\|b\\)*', 'ab', 0, 'found+"-"+g1', 'ab-b'],
+['\\(a+\\|b\\)+', 'ab', 0, 'found+"-"+g1', 'ab-b'],
+['\\(a+\\|b\\)?', 'ab', 0, 'found+"-"+g1', 'a-a'],
+['\\)\\(', '-', 2],
+['[^ab]*', 'cde', 0, 'found', 'cde'],
+['abc', '', 1],
+['a*', '', 0, 'found', ''],
+['a\\|b\\|c\\|d\\|e', 'e', 0, 'found', 'e'],
+['\\(a\\|b\\|c\\|d\\|e\\)f', 'ef', 0, 'found+"-"+g1', 'ef-e'],
+['abcd*efg', 'abcdefg', 0, 'found', 'abcdefg'],
+['ab*', 'xabyabbbz', 1],
+['ab*', 'xayabbbz', 1],
+['\\(ab\\|cd\\)e', 'abcde', 1],
+['[abhgefdc]ij', 'hij', 0, 'found', 'hij'],
+['^\\(ab\\|cd\\)e', 'abcde', 1, 'xg1y', 'xy'],
+['\\(abc\\|\\)ef', 'abcdef', 1],
+['\\(a\\|b\\)c*d', 'abcd', 1],
+['\\(ab\\|ab*\\)bc', 'abc', 0, 'found+"-"+g1', 'abc-a'],
+['a\\([bc]*\\)c*', 'abc', 0, 'found+"-"+g1', 'abc-bc'],
+['a\\([bc]*\\)\\(c*d\\)', 'abcd', 0, 'found+"-"+g1+"-"+g2', 'abcd-bc-d'],
+['a\\([bc]+\\)\\(c*d\\)', 'abcd', 0, 'found+"-"+g1+"-"+g2', 'abcd-bc-d'],
+['a\\([bc]*\\)\\(c+d\\)', 'abcd', 0, 'found+"-"+g1+"-"+g2', 'abcd-b-cd'],
+['a[bcd]*dcdcde', 'adcdcde', 0, 'found', 'adcdcde'],
+['a[bcd]+dcdcde', 'adcdcde', 1],
+['\\(ab\\|a\\)b*c', 'abc', 0, 'found+"-"+g1', 'abc-ab'],
+['\\(\\(a\\)\\(b\\)c\\)\\(d\\)', 'abcd', 0, 'g1+"-"+g2+"-"+g3+"-"+g4', 'abc-a-b-d'],
+['[a-zA-Z_][a-zA-Z0-9_]*', 'alpha', 0, 'found', 'alpha'],
+['^a\\(bc+\\|b[eh]\\)g\\|.h$', 'abh', 1],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'effgz', 0, 'found+"-"+g1+"-"+g2', 'effgz-effgz-None'],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'ij', 0, 'found+"-"+g1+"-"+g2', 'ij-ij-j'],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'effg', 1],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'bcdd', 1],
+['\\(bc+d$\\|ef*g.\\|h?i\\(j\\|k\\)\\)', 'reffgz', 1],
+['\\(\\(\\(\\(\\(\\(\\(\\(\\(a\\)\\)\\)\\)\\)\\)\\)\\)\\)', 'a', 0, 'found', 'a'],
+['multiple words of text', 'uh-uh', 1],
+['multiple words', 'multiple words, yeah', 0, 'found', 'multiple words'],
+['\\(.*\\)c\\(.*\\)', 'abcde', 0, 'found+"-"+g1+"-"+g2', 'abcde-ab-de'],
+['(\\(.*\\), \\(.*\\))', '(a, b)', 0, 'g2+"-"+g1', 'b-a'],
+['[k]', 'ab', 1],
+['a[-]?c', 'ac', 0, 'found', 'ac'],
+['\\(abc\\)\\1', 'abcabc', 0, 'g1', 'abc'],
+['\\([a-c]*\\)\\1', 'abcabc', 0, 'g1', 'abc'],
+['^\\(.+\\)?B', 'AB', 0, 'g1', 'A'],
+['\\(a+\\).\\1$', 'aaaaa', 0, 'found+"-"+g1', 'aaaaa-aa'],
+['^\\(a+\\).\\1$', 'aaaa', 1],
+['\\(abc\\)\\1', 'abcabc', 0, 'found+"-"+g1', 'abcabc-abc'],
+['\\([a-c]+\\)\\1', 'abcabc', 0, 'found+"-"+g1', 'abcabc-abc'],
+['\\(a\\)\\1', 'aa', 0, 'found+"-"+g1', 'aa-a'],
+['\\(a+\\)\\1', 'aa', 0, 'found+"-"+g1', 'aa-a'],
+['\\(a+\\)+\\1', 'aa', 0, 'found+"-"+g1', 'aa-a'],
+['\\(a\\).+\\1', 'aba', 0, 'found+"-"+g1', 'aba-a'],
+['\\(a\\)ba*\\1', 'aba', 0, 'found+"-"+g1', 'aba-a'],
+['\\(aa\\|a\\)a\\1$', 'aaa', 0, 'found+"-"+g1', 'aaa-a'],
+['\\(a\\|aa\\)a\\1$', 'aaa', 0, 'found+"-"+g1', 'aaa-a'],
+['\\(a+\\)a\\1$', 'aaa', 0, 'found+"-"+g1', 'aaa-a'],
+['\\([abc]*\\)\\1', 'abcabc', 0, 'found+"-"+g1', 'abcabc-abc'],
+['\\(a\\)\\(b\\)c\\|ab', 'ab', 0, 'found+"-"+g1+"-"+g2', 'ab-None-None'],
+['\\(a\\)+x', 'aaax', 0, 'found+"-"+g1', 'aaax-a'],
+['\\([ac]\\)+x', 'aacx', 0, 'found+"-"+g1', 'aacx-c'],
+['\\([^/]*/\\)*sub1/', 'd:msgs/tdir/sub1/trial/away.cpp', 0, 'found+"-"+g1', 'd:msgs/tdir/sub1/-tdir/'],
+['\\([^.]*\\)\\.\\([^:]*\\):[T ]+\\(.*\\)', 'track1.title:TBlah blah blah', 0, 'found+"-"+g1+"-"+g2+"-"+g3', 'track1.title:TBlah blah blah-track1-title-Blah blah blah'],
+['\\([^N]*N\\)+', 'abNNxyzN', 0, 'found+"-"+g1', 'abNNxyzN-xyzN'],
+['\\([^N]*N\\)+', 'abNNxyz', 0, 'found+"-"+g1', 'abNN-N'],
+['\\([abc]*\\)x', 'abcx', 0, 'found+"-"+g1', 'abcx-abc'],
+['\\([abc]*\\)x', 'abc', 1],
+['\\([xyz]*\\)x', 'abcx', 1],
+['\\(a\\)+b\\|aac', 'aac', 0, 'found+"-"+g1', 'aac-None'],
+['\\<a', 'a', 0, 'found', 'a'],
+['\\<a', '!', 1],
+['a\\<b', 'ab', 1],
+['a\\>', 'ab', 1],
+['a\\>', 'a!', 0, 'found', 'a'],
+['a\\>', 'a', 0, 'found', 'a'],
+]
+
+# test suite for split()
+# element 0: pattern
+#         1: string to split
+#         2: compile result
+#         3: maxsplit
+#         4: list of split fields
+split_regex_tests = [
+["[ |,]", "with you, nothing, and me", 0, 0, ["with","you","nothing","and","me"]],
+["[ |,]", "with you, nothing, and me", 0, 1, ["with", "you, nothing, and me"]],
+["\\ ", "send email to apply", 0, 0, ["send", "email", "to", "apply"]],
+["\\ ", "send email to apply", 0, 2, ["send", "email", "to apply"]],
+["[+ | -]", "+86-028-83201034", 0, 0, ["86", "028", "83201034"]],
+["[+ | -]", "+86-028-83201034", 0, 1, ["86", "028-83201034"]],
+["[*|#]", "slide show", 0, 0, ["slide show"]],
+["(", "whats ever", 0, 1, ["whats ever"]],
+["@#!~$%^&*()<>\n", "who knows", 0, 1, ["who knows"]],
+]
+
+# test suite for findall()
+# element 0: pattern
+#         1: string to match
+#         2: compile result
+#         3: starting position
+#         4: list of matched fields
+
+# reobj.findall()
+findall_regex_tests = [
+["\\ ", "send email to apply", 0, 0, [" ", " ", " "]],
+["\\ ", "send email to apply", 0, 5, [" ", " "]],
+["[+ | -]", "+86-028-83201034", 0, 0, ["+", "-", "-"]],
+["[+ | -]", "+86-028-83201034", 0, 1, ["-", "-"]],
+["sl.*e\\|#", "slide show at Room #3", 0, 0, ["slide", "#"]],
+["w.+s\\|e.*r", "whats ever", 0, 0, ["whats", "ever"]],
+["Euler\\|Gauss", "Both Euler and Gauss are great mathematicians", 0, 0, ["Euler", "Gauss"]],
+]
+
+# module re.findall()
+mod_findall_regex_tests = [
+["\\ ", "send email to apply", 0, 0, [" ", " ", " "]],
+["\\ ", "send email to apply", 0, 0, [" ", " ", " "]],
+["[+ | -]", "+86-028-83201034", 0, 0, ["+", "-", "-"]],
+["[+ | -]", "+86-028-83201034", 0, 0, ["+", "-", "-"]],
+["sl.*e\\|#", "slide show at Room #3", 0, 0, ["slide", "#"]],
+["w.+s\\|e.*r", "whats ever", 0, 0, ["whats", "ever"]],
+["Euler\\|Gauss", "Both Euler and Gauss are great mathematicians", 0, 0, ["Euler", "Gauss"]],
+]
+
+# tests for match object's groups(), start(), end() and span() methods
+# element 0: pattern
+#         1: string
+#         2: compile result
+#         3: matched fields, for groups()
+#         4: group index, valid when > 0, for start(), end(), and span()
+#         5: indexed group's starting index in string, for start() and span()
+#         6: indexed group's ending index in string, for end() and span()
+matobj_groups_regex_tests = [
+["\\(abc\\(.*xyz\\)\\(.*31415926\\)\\)", "where is abc and flurry xyz, which is pi 31415926, derived from ms", 0, ["abc and flurry xyz, which is pi 31415926"," and flurry xyz",", which is pi 31415926"], 2, 12, 27],
+
+["[a\\|b]\\(.+\\)shoe\\([t]+\\)d", "bbbshoetttdxrznmlkjp", 0, ["bb", "ttt"], 1, 1, 3],
+
+["abcdef", "xyah2oewoyqe030uabcdefwhalsdewnkhgiohyczb", 0, [], -1, 0, 0],
+]
+