I wrote this function, and I think it can be improved quite a bit. It produces the desired result, but it took me many lines of code. Any ideas on how to optimize it?
import json
import re
import urllib.parse
import urllib.request
# Sample DNI passed to get_cuit() by the call further down in this script.
dni = 71_179_047
def get_cuit(dni, *, search_url="https://www.cuitonline.com/search.php", timeout=30):
    """Return the first CUIT found on the search page for ``dni``, digits only.

    The page at ``search_url`` is requested with ``q=<dni>`` as its query
    string, and the first piece of text shaped like a CUIT (two digits,
    optionally parenthesised, an optional hyphen, seven or eight digits, a
    hyphen and one final digit) is taken from the response.

    Args:
        dni: The DNI to search for; any value that ``str()`` can render.
        search_url: URL of the search page, without the query string.
        timeout: Seconds to wait on the connection before giving up.

    Returns:
        The matched CUIT as a string with every non-digit character removed.

    Raises:
        IndexError: If the response contains nothing shaped like a CUIT.
            (The type is kept from the previous ``findall(...)[0]`` version
            so existing ``except IndexError`` handlers keep working.)
        urllib.error.URLError: If the page cannot be fetched.
    """
    # urlencode escapes the value, so a DNI given as an arbitrary string
    # cannot break or extend the query string.
    url = search_url + "?" + urllib.parse.urlencode({"q": dni})

    # The context manager closes the connection even when reading fails.
    with urllib.request.urlopen(url, timeout=timeout) as response:
        # ISO-8859-1 maps every byte to a character, so decoding never raises;
        # the pattern below only involves ASCII characters anyway.
        html = response.read().decode("ISO-8859-1")

    # Only the first occurrence is needed, so stop scanning at the first hit.
    match = re.search(r"\(?\b[0-9]{2}\)?-?[0-9]{7,8}-[0-9]{1}\b", html)
    if match is None:
        raise IndexError("no CUIT found in the response for DNI {!r}".format(dni))

    # Drop the parentheses and hyphens, keeping only the digits.
    return re.sub("[^0-9]", "", match.group())
# Run the lookup only when this file is executed as a script, so importing the
# module does not fire a network request, and print the result instead of
# discarding it.
if __name__ == "__main__":
    print(get_cuit(dni))