# 💠 Regex Examples


In [0]:
import re

## 🖼️ Images
- `.jpg`, `.png` and `.gif`

In [0]:
# Sample file names, separated by single spaces, used as input for the
# image-extension pattern.
FILES = " ".join(
    [
        "esma.jpg",
        "ESMA.png",
        "asmaa.gif",
        "song.mp3",
        "code.m",
        "example.wav",
        "bird.jpeg",
    ]
)

In [68]:
# Match whitespace-free names ending in ".jpg", ".png" or ".gif".
# The pattern is a raw string so "\S" is not treated as a (invalid) string
# escape, and the dot is escaped so it matches a literal "." rather than any
# character.
re.findall(r"\S+\.(?:jpg|png|gif)", FILES)

['esma.jpg', 'ESMA.png', 'asmaa.gif']

## 🌎 HTML tags

In [0]:
# Sample text for the tag patterns: four well-formed tags, three plain words,
# and three bracket sequences with an empty or blank tag name.
TAGS = (
    "<html> </b> <h2> </code> "
    "non-tag random notHTML "
    "<> </> < >"
)

In [70]:
# "<", an optional "/", then one or more characters that are neither ">" nor
# whitespace, then ">".
# Inside a character class "(", "|" and ")" are literal characters, not
# grouping or alternation, so they are dropped from the class.
# "</>" still matches because the "/" can be consumed by the character class.
re.findall(r"</?[^>\s]+>", TAGS)

['<html>', '</b>', '<h2>', '</code>', '</>']

In [71]:
# Variant that also bars "/" from the tag body, which rejects "</>".
# The body is a *repeated capturing group*: findall returns the group's text
# instead of the whole match, and a repeated group keeps only its last
# repetition, so each result is the final character of a tag name.
re.compile(r"<\/?([^(\/>|\s)])+>").findall(TAGS)

['l', 'b', '2', 'e']

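> Note: the pattern contains a capturing group, so `re.findall` returns the group's text instead of the whole match, and because the group is repeated (`(...)+`) only its last repetition is kept — the final character of each tag name. Dropping the group, e.g. `r"</?[^/>\s]+>"`, returns the whole tags: `['<html>', '</b>', '<h2>', '</code>']`.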

## 📧 Email Addresses

In [0]:
# Sample tokens, separated by single spaces, used as input for the e-mail
# pattern.
EMAILS = " ".join(
    [
        "esma@gmail.com",
        "asmaa@ogr.iu.edu.tr",
        "asmaa.mirkhan@example.com",
        "not.an@email",
        "just.aString",
    ]
)

In [73]:
# local part (non-whitespace), "@", a word-character label, a literal dot,
# then the rest of the domain (non-whitespace).
# "[@]{1}" and "[.]+" are written as the equivalent "@" and "\."; any extra
# dots are still absorbed by the trailing "\S+".
re.findall(r"\S+@\w+\.\S+", EMAILS)

['esma@gmail.com', 'asmaa@ogr.iu.edu.tr', 'asmaa.mirkhan@example.com']

## 📅 Dates

In [0]:
# Sample dates in numeric and month-name layouts, joined by " \n " so each
# date sits on its own line of the resulting string.
DATE_FORMATS = " \n ".join(
    [
        "21-05-2020",
        "21/05/2020",
        "21/05/20",
        "5/21/2020",
        "1 Jul 2020",
        "1 July 2020",
        "Jul 1, 2020",
        "July 1, 2020",
    ]
)

### 🔢 Numerical Dates

In [75]:
# One or two digits, "/" or "-", one or two digits, "/" or "-", then a
# two-to-four digit year. Raw string so "\d" reaches the regex engine without
# being an invalid string escape.
re.findall(r"\d{1,2}[/-]\d{1,2}[/-]\d{2,4}", DATE_FORMATS)

['21-05-2020', '21/05/2020', '21/05/20', '5/21/2020']

### 🔠 Alphanumerical Dates

In [76]:
# Day, abbreviated month name, year.
# The month alternation is a capturing group, so findall returns only the
# captured month name instead of the whole date.
re.findall(r"\d{1,2} (Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec) \d{2,4}", DATE_FORMATS)

['Jul']

In [77]:
# Same pattern with a non-capturing group "(?:...)", so findall returns the
# whole matched date.
re.findall(r"\d{1,2} (?:Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec) \d{2,4}", DATE_FORMATS)

['1 Jul 2020']

In [78]:
# "[a-z]*" after the three-letter abbreviation lets the month be spelled out
# in full ("Jul" or "July").
re.findall(r"\d{1,2} (?:Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec)[a-z]* \d{2,4}", DATE_FORMATS)

['1 Jul 2020', '1 July 2020']

In [79]:
# Accepts both "day month year" and "month day, year": the leading day and the
# "day, " after the month are each optional, followed by a four-digit year.
re.findall(r"(?:\d{1,2} )?(?:Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec)[a-z]* (?:\d{1,2}, )?\d{4}", DATE_FORMATS)

['1 Jul 2020', '1 July 2020', 'Jul 1, 2020', 'July 1, 2020']