# Doesn't this do what you want?
#
# Extract the date (dd/dd/dddd) and time (dd:dd) values from a run of HTML
# table cells, skipping cells that hold anything else (weekday names, blanks).

import re

# Matches one <td>...</td> cell whose entire content is a date or a time.
# Group 1 is the cell content, group 2 is set for a date, group 3 for a time.
DATE_TIME_RE = re.compile(r'<td>((\d{2}\/\d{2}\/\d{4})|(\d{2}:\d{2}))<\/td>')

# Sample input: adjacent string literals are concatenated into one string.
test = (
    '<td>04/01/2006</td>'
    '<td>Wednesday</td>'
    '<td> </td>'
    '<td>09:14</td>'
    '<td>12:44</td>'
    '<td>12:50</td>'
    '<td>17:58</td>'
    '<td> </td>'
    '<td> </td>'
    '<td> </td>'
    '<td> </td>'
    '<td>08:14</td>'
)

# With several groups in the pattern, findall() yields one tuple per match;
# element 0 is group 1, i.e. the matched date or time text.
out = [groups[0] for groups in DATE_TIME_RE.findall(test)]

for value in out:
    # Parenthesised form prints the same on Python 2 and Python 3.
    print(value)

# -- http://mail.python.org/mailman/listinfo/python-list