File: generate-bacnet-vendors.py

package info (click to toggle)

wireshark 2.2.4+gcc3dc1b-1~bpo8+1

links: PTS, VCS
area: main
in suites: jessie-backports
size: 219,640 kB
sloc: ansic: 2,167,318; cpp: 74,818; xml: 72,255; python: 31,527; perl: 26,604; makefile: 9,716; lex: 6,888; sh: 6,376; pascal: 4,608; yacc: 242; asm: 156; awk: 58; tcl: 35

file content (54 lines) | stat: -rwxr-xr-x 1,745 bytes

#!/usr/bin/env python2

'''
 Copyright 2014 Anish Bhatt <anish@chelsio.com>

 This program is free software; you can redistribute it and/or
 modify it under the terms of the GNU General Public License
 as published by the Free Software Foundation; either version 2
 of the License, or (at your option) any later version.

 This program is distributed in the hope that it will be useful,
 but WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 GNU General Public License for more details.

 You should have received a copy of the GNU General Public License
 along with this program; if not, write to the Free Software
 Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
'''

from bs4 import BeautifulSoup
import urllib
import sys
import string
# Required to convert accents/diaeresis etc.
import translitcodec

# Scrape the BACnet vendor ID web page and print a C value_string table
# (BACnetVendorIdentifiers) to stdout, one "{ id, "name" }," line per vendor.

# Page whose first <table> holds the vendor ID / organization columns.
VENDOR_ID_URL = "http://www.bacnet.org/VendorID/BACnet%20Vendor%20IDs.htm"


def _first_text(cell):
    '''Return the first text node of a table cell, or u'' if it has none.'''
    node = cell.find(text=True)
    if node is None:
        # An empty cell would otherwise make ''.join(None) raise TypeError
        return u''
    return u''.join(node)


def _to_ascii(text):
    '''Return text reduced to plain ASCII.

    Relies on the "translit/long" codec, which is registered as a side
    effect of importing translitcodec at the top of this file.
    '''
    # Required specially for "Dorsette's Inc." due to malformed html
    text = text.replace(u'\u0092', u'\'')
    # Required to convert accents/diaeresis etc.
    text = text.encode('translit/long')
    # Encode to ascii so we can output to file; anything left over is dropped
    return text.encode("ascii", 'ignore')


def _c_escape(text):
    '''Escape backslashes and double quotes for use in a C string literal.'''
    # Backslashes first, so the ones added for quotes are not doubled again
    return text.replace('\\', '\\\\').replace('"', '\\"')


response = urllib.urlopen(VENDOR_ID_URL)
try:
    html = response.read()
finally:
    # Release the connection even if the download fails part-way
    response.close()

soup = BeautifulSoup(html)
table = soup.find('table')
if table is None:
    sys.exit("No <table> element found at %s" % VENDOR_ID_URL)

# Emit the array header explicitly instead of relying on the first table
# row happening to contain no <td> cells.
print("static const value_string\nBACnetVendorIdentifiers [] = {")

for tr in table.findAll('tr'):
    cols = tr.findAll('td')
    # Rows without both an ID and a name cell (e.g. a <th> header row)
    # carry no entry; printing for them would duplicate or truncate a line.
    if len(cols) < 2:
        continue
    vendor_id = _to_ascii(_first_text(cols[0])).strip()
    # A value_string key must be an integer literal; skip anything else
    if not vendor_id.isdigit():
        continue
    # Escape only after transliteration, so quotes it produces are covered
    name = _c_escape(_to_ascii(_first_text(cols[1]).rstrip()))
    print("    { %3s, \"%s\" }," % (vendor_id, name))

# Terminating sentinel entry and end of the array
print("    { 0, NULL }\n};")