-
-
Save ryanmerolle/285df99b97c3bfea20a9f57e1c29cecd to your computer and use it in GitHub Desktop.
Python IPV4 / IPV6 Regular Expressions (REGEX)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Constructed with help from | |
# http://stackoverflow.com/questions/53497/regular-expression-that-matches-valid-ipv6-addresses | |
# Try it on regex101: https://regex101.com/r/yVdrJQ/1 | |
import re | |
IPV4SEG = r'(?:25[0-5]|(?:2[0-4]|1{0,1}[0-9]){0,1}[0-9])' | |
IPV4ADDR = r'(?:(?:' + IPV4SEG + r'\.){3,3}' + IPV4SEG + r')' | |
IPV6SEG = r'(?:(?:[0-9a-fA-F]){1,4})' | |
IPV6GROUPS = ( | |
r'(?:' + IPV6SEG + r':){7,7}' + IPV6SEG, # 1:2:3:4:5:6:7:8 | |
r'(?:' + IPV6SEG + r':){1,7}:', # 1:: 1:2:3:4:5:6:7:: | |
r'(?:' + IPV6SEG + r':){1,6}:' + IPV6SEG, # 1::8 1:2:3:4:5:6::8 1:2:3:4:5:6::8 | |
r'(?:' + IPV6SEG + r':){1,5}(?::' + IPV6SEG + r'){1,2}', # 1::7:8 1:2:3:4:5::7:8 1:2:3:4:5::8 | |
r'(?:' + IPV6SEG + r':){1,4}(?::' + IPV6SEG + r'){1,3}', # 1::6:7:8 1:2:3:4::6:7:8 1:2:3:4::8 | |
r'(?:' + IPV6SEG + r':){1,3}(?::' + IPV6SEG + r'){1,4}', # 1::5:6:7:8 1:2:3::5:6:7:8 1:2:3::8 | |
r'(?:' + IPV6SEG + r':){1,2}(?::' + IPV6SEG + r'){1,5}', # 1::4:5:6:7:8 1:2::4:5:6:7:8 1:2::8 | |
IPV6SEG + r':(?:(?::' + IPV6SEG + r'){1,6})', # 1::3:4:5:6:7:8 1::3:4:5:6:7:8 1::8 | |
r':(?:(?::' + IPV6SEG + r'){1,7}|:)', # ::2:3:4:5:6:7:8 ::2:3:4:5:6:7:8 ::8 :: | |
r'fe80:(?::' + IPV6SEG + r'){0,4}%[0-9a-zA-Z]{1,}', # fe80::7:8%eth0 fe80::7:8%1 (link-local IPv6 addresses with zone index) | |
r'::(?:ffff(?::0{1,4}){0,1}:){0,1}[^\s:]' + IPV4ADDR, # ::255.255.255.255 ::ffff:255.255.255.255 ::ffff:0:255.255.255.255 (IPv4-mapped IPv6 addresses and IPv4-translated addresses) | |
r'(?:' + IPV6SEG + r':){1,6}:?[^\s:]' + IPV4ADDR, # 2001:db8:3:4::192.0.2.33 64:ff9b::192.0.2.33 (IPv4-Embedded IPv6 Address) | |
) | |
IPV6ADDR = '|'.join(['(?:{})'.format(g) for g in IPV6GROUPS[::-1]]) # Reverse rows for greedy match | |
tests = [ | |
'1::', | |
'1:2:3:4:5:6:7::', | |
'1::8', | |
'1:2:3:4:5:6::8', | |
'1:2:3:4:5:6::8', | |
'1::7:8', | |
'1:2:3:4:5::7:8', | |
'1:2:3:4:5::8', | |
'1::6:7:8', | |
'1:2:3:4::6:7:8', | |
'1:2:3:4::8', | |
'1::5:6:7:8', | |
'1:2:3::5:6:7:8', | |
'1:2:3::8', | |
'1::4:5:6:7:8', | |
'1:2::4:5:6:7:8', | |
'1:2::8', | |
'1::3:4:5:6:7:8', | |
'1::3:4:5:6:7:8', | |
'1::8', | |
'::2:3:4:5:6:7:8', | |
'::2:3:4:5:6:7:8', | |
'::8', | |
'::', | |
'fe80::7:8%eth0', | |
'fe80::7:8%1', | |
'::255.255.255.255', | |
'::ffff:255.255.255.255', | |
'::ffff:0:255.255.255.255', | |
'2001:db8:3:4::192.0.2.33', | |
'64:ff9b::192.0.2.33', | |
] | |
# IPV6ADDR Tests | |
def test_individual(tests): | |
for t in tests: | |
assert re.search(IPV6ADDR, t).group() == t | |
# MULTILINE | |
def test_multiline(tests): | |
_tests = tests[:] | |
for t in re.findall(IPV6ADDR, ' '.join(tests)): | |
_tests.remove(t) | |
assert not _tests | |
test_individual(tests) | |
test_multiline(tests) |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment