1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218
|
# rnc.py - functions for handling Dominican Republic tax registration
# coding: utf-8
#
# Copyright (C) 2015-2024 Arthur de Jong
#
# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
#
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
# 02110-1301 USA
# Development of this functionality was funded by iterativo | https://iterativo.do
"""RNC (Registro Nacional del Contribuyente, Dominican Republic tax number).
The RNC is the Dominican Republic taxpayer registration number for
institutions. The number consists of 9 digits.
>>> validate('1-01-85004-3')
'101850043'
>>> validate('1018A0043')
Traceback (most recent call last):
...
InvalidFormat: ...
>>> validate('101850042')
Traceback (most recent call last):
...
InvalidChecksum: ...
>>> format('131246796')
'1-31-24679-6'
"""
from __future__ import annotations
import json
from stdnum.exceptions import *
from stdnum.util import clean, get_soap_client, isdigits
# RNCs that fail the regular checks but are valid nonetheless; validate()
# accepts these before looking at length or check digit (note that one of
# the entries is only 8 digits long)
whitelist = {
    '101581601', '101582245', '101595422', '101595785', '10233317',
    '131188691', '401007374', '501341601', '501378067', '501620371',
    '501651319', '501651823', '501651845', '501651926', '501656006',
    '501658167', '501670785', '501676936', '501680158', '504654542',
    '504680029', '504681442', '505038691',
}
dgii_wsdl = 'https://www.dgii.gov.do/wsMovilDGII/WSMovilDGII.asmx?WSDL'
"""The WSDL URL of DGII validation service."""
def compact(number: str) -> str:
    """Return the minimal representation of the number.

    Spaces and dashes are removed with clean() and any whitespace that
    still surrounds the result is stripped.
    """
    without_separators = clean(number, ' -')
    return without_separators.strip()
def calc_check_digit(number: str) -> str:
    """Calculate the check digit.

    The number should be passed without its check digit. Each digit is
    multiplied by its positional weight; digits beyond the eighth are
    ignored because zip() stops at the shortest input. The weighted sum
    modulo 11 is then mapped onto a single character in the range 1-9.
    """
    weights = (7, 9, 8, 6, 5, 4, 3, 2)
    total = 0
    for weight, digit in zip(weights, number):
        total += weight * int(digit)
    remainder = total % 11
    return str((10 - remainder) % 9 + 1)
def validate(number: str) -> str:
    """Check if the number provided is a valid RNC.

    Returns the compact form of the number when it is valid. Raises
    InvalidFormat if the compacted number contains non-digits,
    InvalidLength if it is not 9 digits long and InvalidChecksum if the
    last digit does not match the calculated check digit.
    """
    compacted = compact(number)
    if not isdigits(compacted):
        raise InvalidFormat()
    # whitelisted numbers are accepted as-is, before the length and
    # check digit tests that they would otherwise fail
    if compacted not in whitelist:
        if len(compacted) != 9:
            raise InvalidLength()
        expected = calc_check_digit(compacted[:-1])
        if expected != compacted[-1]:
            raise InvalidChecksum()
    return compacted
def is_valid(number: str) -> bool:
    """Check if the number provided is a valid RNC.

    This is the non-raising counterpart of validate(): any ValidationError
    is turned into False.
    """
    try:
        validated = validate(number)
    except ValidationError:
        return False
    return bool(validated)
def format(number: str) -> str:
    """Reformat the number to the standard presentation format.

    The compacted number is split into its first character, the next two
    characters, the remaining characters up to the last one and the last
    character, joined by dashes (e.g. 1-31-24679-6).
    """
    digits = compact(number)
    groups = (digits[:1], digits[1:3], digits[3:-1], digits[-1])
    return '-'.join(groups)
def _convert_result(result: str) -> dict[str, str]:  # pragma: no cover
    """Translate SOAP result entries into dicts.

    The result is a JSON object in text form. Known DGII field names are
    replaced by their English equivalents; any other key is kept unchanged.
    """
    translation = {
        'RGE_RUC': 'rnc',
        'RGE_NOMBRE': 'name',
        'NOMBRE_COMERCIAL': 'commercial_name',
        'CATEGORIA': 'category',
        'REGIMEN_PAGOS': 'payment_regime',
        'ESTATUS': 'status',
        'RNUM': 'result_number',
    }
    # literal newlines and tabs are turned into their JSON escape sequences
    # before parsing, since the JSON parser rejects them inside strings
    escaped = result.replace('\n', '\\n').replace('\t', '\\t')
    return {
        translation.get(key, key): value
        for key, value in json.loads(escaped).items()
    }
def check_dgii(
    number: str,
    timeout: float = 30,
    verify: bool | str = True,
) -> dict[str, str] | None:  # pragma: no cover
    """Lookup the number using the DGII online web service.

    This uses the validation service run by the Dirección General de
    Impuestos Internos, the Dominican Republic tax department, to look up
    registration information for the number.

    The `timeout` argument specifies the network timeout in seconds.

    The `verify` argument is either a boolean that determines whether the
    server's certificate is validated or a string which must be a path to
    the CA certificate bundle to use for verification.

    Returns a dict with the following structure::

        {
            'rnc': '123456789',  # The requested number
            'name': 'The registered name',
            'commercial_name': 'An additional commercial name',
            'status': '2',  # 1: inactive, 2: active
            'category': '0',  # always 0?
            'payment_regime': '2',  # 1: N/D, 2: NORMAL, 3: PST
        }

    Will return None if the number is invalid or unknown (the service
    answers with '0' in that case).
    """
    # this function isn't automatically tested because it would require
    # network access for the tests and unnecessarily load the online service
    compacted = compact(number)
    client = get_soap_client(dgii_wsdl, timeout=timeout, verify=verify)
    response = client.GetContribuyentes(
        value=compacted,
        patronBusqueda=0,  # search type: 0=by number, 1=by name
        inicioFilas=1,  # start result (1-based)
        filaFilas=1,  # end result
        IMEI='')
    if response and 'GetContribuyentesResult' in response:
        response = response['GetContribuyentesResult']  # PySimpleSOAP only
    if response == '0':
        return None
    # entries are separated by '@@@'; only the first one is of interest
    first_entry = response.split('@@@')[0]
    return _convert_result(first_entry)
def search_dgii(
    keyword: str,
    end_at: int = 10,
    start_at: int = 1,
    timeout: float = 30,
    verify: bool | str = True,
) -> list[dict[str, str]]:  # pragma: no cover
    """Search the DGII online web service using the keyword.

    This uses the validation service run by the Dirección General de
    Impuestos Internos, the Dominican Republic tax department, to search
    the registration information using the keyword.

    The number of entries returned can be tuned with the `end_at` and
    `start_at` arguments.

    The `timeout` argument specifies the network timeout in seconds.

    The `verify` argument is either a boolean that determines whether the
    server's certificate is validated or a string which must be a path to
    the CA certificate bundle to use for verification.

    Returns a list of dicts with the following structure::

        [
            {
                'rnc': '123456789',  # The found number
                'name': 'The registered name',
                'commercial_name': 'An additional commercial name',
                'status': '2',  # 1: inactive, 2: active
                'category': '0',  # always 0?
                'payment_regime': '2',  # 1: N/D, 2: NORMAL, 3: PST
                'result_number': '1',  # index of the result
            },
            ...
        ]

    Will return an empty list if the service reports no results (it
    answers with '0' in that case).
    """
    # this function isn't automatically tested because it would require
    # network access for the tests and unnecessarily load the online service
    client = get_soap_client(dgii_wsdl, timeout=timeout, verify=verify)
    response = client.GetContribuyentes(
        value=keyword,
        patronBusqueda=1,  # search type: 0=by number, 1=by name
        inicioFilas=start_at,  # start result (1-based)
        filaFilas=end_at,  # end result
        IMEI='')
    if response and 'GetContribuyentesResult' in response:
        response = response['GetContribuyentesResult']  # PySimpleSOAP only
    if response == '0':
        return []
    # entries are separated by '@@@', each one a JSON object in text form
    entries = response.split('@@@')
    return [_convert_result(entry) for entry in entries]
|