@szczys
Last active November 28, 2020 07:32
The holy tokenizer
def tokenize(instring, delimiters=[',',':',';','[',']','+','-']):
    '''
    Tokenize a string of ASM code, splitting based on special characters
    but at the same time including delimiters (but not whitespace) in the set
    '''
    tokens = instring.split()
    for d in delimiters:
        newtokens = list()
        for t in tokens:
            raw = t.split(d)
            for r_idx, r_token in enumerate(raw):
                if r_token != '':
                    # An element will be empty when the delimiter begins or
                    # ends the string that was split, so don't add empty elements
                    newtokens.append(r_token)
                if r_idx != len(raw)-1:
                    newtokens.append(d)
        tokens = newtokens
    return tokens
test = "MOV [ R7 :R8],R0 ; Testing stuff"
print(tokenize(test))
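
If I've traced the loops correctly, the test line should print:

['MOV', '[', 'R7', ':', 'R8', ']', ',', 'R0', ';', 'Testing', 'stuff']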
@carl3 commented Nov 24, 2020

The unholy tokenizer (in perl to maximize unholiness):

s/\s*;.*//; # Trimming comments is easy in perl
@tokens = split(/\s*([,:;\[\]+\-])\s*| +/,$_);

or sanctified unholiness in python:

import re
tokens = re.split(r'\s*([,:;\[\]+\-])\s*|\s+',instring)

But if there are two delimiters in a row (or a leading or trailing delimiter), you get an empty string. If you need to strip those, there are many ways:

@tokens = grep(/./,split(/\s*([,:;\[\]+\-])\s*|\s+/,$_));
@tokens = grep {$_ ne ''}  split(/\s*([,:;\[\]+\-])\s*|\s+/,$_);
@tokens = map {$_ ne '' ? $_ : ()} split(/\s*([,:;\[\]+\-])\s*|\s+/,$_);

or in python

tokens = list(filter(None,re.split(r'\s*([,:;\[\]+\-])\s*|\s+',instring)))
tokens = [x for x in re.split(r'\s*([,:;\[\]+\-])\s*|\s+',instring) if x!='']
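
For what it's worth, running the filtered split on the gist's test string should give the same tokens as the original function (assuming I've traced the regex correctly):

import re
test = "MOV [ R7 :R8],R0 ; Testing stuff"
print([x for x in re.split(r'\s*([,:;\[\]+\-])\s*|\s+', test) if x])
# ['MOV', '[', 'R7', ':', 'R8', ']', ',', 'R0', ';', 'Testing', 'stuff']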

(You can also add a space to the set of delimiters)

Geez, regular expressions aren't that hard to learn. While regex is a poor approach to complex parsers, an assembler can be simple enough that you can probably tokenize and parse at the same time with regexes, maybe even map straight to machine code. If the syntax doesn't match on assembly input, you can use a regex test to issue nice error messages, e.g. "'MOVE' is not a valid operator" or "MOV requires an [Rn:Rm] operand". I would guess that a simple assembly parser might only be 10 lines of perl or 20 of python, plus whatever error messages.
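
A minimal sketch of that idea in python, assuming a made-up "MOV [Rn:Rm],Rd" syntax (the real badge instruction set isn't shown in this thread):

import re

def parse_mov(line):
    # Hypothetical syntax "MOV [Rn:Rm],Rd": tokenize, validate, and
    # extract the fields with a single regex match
    m = re.match(r'\s*(\w+)\s*\[\s*R(\d+)\s*:\s*R(\d+)\s*\]\s*,\s*R(\d+)\s*$', line)
    if m is None:
        return 'error: MOV requires an [Rn:Rm] operand'
    if m.group(1) != 'MOV':
        return "'%s' is not a valid operator" % m.group(1)
    op, rn, rm, rd = m.groups()
    return (op, int(rn), int(rm), int(rd))

print(parse_mov('MOV [R7:R8],R0'))   # ('MOV', 7, 8, 0)
print(parse_mov('MOVE [R7:R8],R0'))  # 'MOVE' is not a valid operator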

BTW, you can make your regex easier to read/write if you do some cleanup/simplifications before parsing, e.g. (in perl for brevity):

s/\s+/ /g; # Convert all whitespace spans to a single space
s/ *([^\s\w]+) */$1/g; # Trim space around non-word delimiters

Also, compose a complex regex on several lines with comments using variables.
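
In python the same idea might use re.VERBOSE (perl's /x flag is the equivalent), with the delimiter set kept in a variable; a sketch:

import re

delimpat = re.escape(',:;[]+-')   # delimiter characters, kept in one place
pattern = re.compile(rf'''
    \s* ( [{delimpat}] ) \s*   # a delimiter, with surrounding space trimmed
    | \s+                      # or a bare run of whitespace
''', re.VERBOSE)
print([t for t in pattern.split('MOV [ R7 :R8],R0') if t])
# ['MOV', '[', 'R7', ':', 'R8', ']', ',', 'R0']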

@szczys (author) commented Nov 26, 2020

Thanks for this! I tried out your suggestions and they work in almost all cases. As you mentioned, whitespace isn't returned as a delimiter by the regex you used, so, for instance, it fails on code like:

max EQU 15
min EQU max-11

I have little to no experience with regex. I'll add it to my project list and try diving into it once again (I've tried before, but TBH it's never felt exciting to me). From where I sit, the regex you showed feels much harder to audit for errors than The Holy Tokenizer™, and harder to extend with new delimiters in the future.

However, I find the succinctness of your approach extremely tasty! This assembler is for a Hackaday conference badge to be unveiled after the great distancing has ended. Perhaps we should have an assembler optimization contest? Currently my version is 884 lines (including comments and helpful error messages) and 32k. I'd love to see how small this task can be made ;-)

@carl3 commented Nov 28, 2020

Mike, you've piqued my curiosity about the use of regex in simple parsers and assemblers. Long ago I wrote one or two assemblers in high school (in assembly), then learned the now out-of-fashion table-driven LALR compilers (with error reporting and recovery) in college, where we wrote our own equivalent of yacc/lex. I got into regex writing perl code to clean up messed-up data files, where it was a godsend for fixing weird abbreviations and corrupt data, and also in web scraping, where custom scripts eventually evolved into a generic data converter with simple patterns read in and compiled into regex code. Basic regex OR patterns are not too hard. I rarely use lookahead or other advanced features, so I always have to look those up. But I've learned how to debug (trim down the pattern till you find the mismatch) and to use regex wisely with some tricks, including table lookups in a substitution string. Perl is designed for regex, so it's hard not to drink the regex kool-aid when using perl. :-)

I was trying to find the badge processor and didn't realize it's not released. I would be interested to see how a regex-based assembler might look. If you can post the assembly syntax and machine code (or post your 884-line prototype) I would be happy to see how some alternatives might look, and post a regex solution or whatever makes sense.

Small isn't the main goal, but less code, well commented and easy to understand (even by regex-phobes), and easy to extend is good.

With the python versions:

import re
instring = 'min EQU max-11'   # the example that failed above
# Plain split on delimiters excluding space
re.split(r'\s*([,:;\[\]+\-])\s*|\s+',instring)
# Clean null delimiters after split
list(filter(None,re.split(r'\s*([,:;\[\]+\-])\s*|\s+',instring)))
# Add space as a returned delimiter
re.split(r'\s*([,:;\[\]+\- ])\s*',instring)

Using |\s+ in the split, you get the string with None delimiters:
['min', None, 'EQU', None, 'max', '-', '11']
with the None entries filtered out:
['min', 'EQU', 'max', '-', '11']
or, extending the delimiter characters to include space:
['min', ' ', 'EQU', ' ', 'max', '-', '11']

Note that if we first map every run of whitespace (tab/space) on a line to a single ' ' and trim spaces around delimiters (\s*([{some-delimiters}])\s*), then you can just write re.split(r'([,:;\[\]+\-])', instring). The \s* means 0 or more whitespace characters, the [] encloses the delimiter characters, and \ precedes the special characters.
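
In python, that pre-cleanup might look roughly like this (a sketch; the input is assumed to already have comments stripped):

import re

line = 'MOV \t [ R7 :R8],  R0'                     # assumed comment-free input
line = re.sub(r'\s+', ' ', line)                   # collapse whitespace runs to one space
line = re.sub(r' ?([,:;\[\]+\-]) ?', r'\1', line)  # trim space around each delimiter
print([t for t in re.split(r'([,:;\[\]+\-])', line) if t])
# ['MOV', '[', 'R7', ':', 'R8', ']', ',', 'R0']
# note: any spaces still left would separate plain words, hence the
# space-as-delimiter variant below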

To make delimiters extensible (with space as a delimiter), use:

delimiters = ' ,:[]+-;' # Delimiters to separate line items
delimpat = re.escape(delimiters) # Delimiters for use in a regex
tokens = list(filter(None,re.split(r'\s*(['+delimpat+r'])\s*',instring)))
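
For instance, on the line that tripped things up earlier, this should give (matching the output shown above):

print(list(filter(None, re.split(r'\s*(['+delimpat+r'])\s*', 'min EQU max-11'))))
# ['min', ' ', 'EQU', ' ', 'max', '-', '11']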

@szczys (author) commented Nov 28, 2020

Well, I'm not super excited to have it out there since it still feels a bit hacky. But it is relatively stable right now, and of course I'm always happy to have help on passion projects like the conference badges ;-)

Here's a snapshot to play with: https://gist.github.com/szczys/b9a19714ea27d50be01d1a8479f97795
