aboutsummaryrefslogtreecommitdiffstats
path: root/tools/generate-bacnet-vendors.py
blob: d068d3ebd722f5c32f5ea94f457d4f01c41e245a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
#!/usr/bin/env python2

'''
 Copyright 2014 Anish Bhatt <anish@chelsio.com>

 This program is free software; you can redistribute it and/or
 modify it under the terms of the GNU General Public License
 as published by the Free Software Foundation; either version 2
 of the License, or (at your option) any later version.

 This program is distributed in the hope that it will be useful,
 but WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 GNU General Public License for more details.

 You should have received a copy of the GNU General Public License
 along with this program; if not, write to the Free Software
 Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
'''

from bs4 import BeautifulSoup
import urllib
import sys
import string
# Required to convert accents/diaeresis etc.
import translitcodec

f = urllib.urlopen("http://www.bacnet.org/VendorID/BACnet%20Vendor%20IDs.htm")
html = f.read()
soup = BeautifulSoup(''.join(html))

entry = "static const value_string\nBACnetVendorIdentifiers [] = {"
table = soup.find('table')

rows = table.findAll('tr')

for tr in rows:
  cols = tr.findAll('td')
  for index,td in enumerate(cols[0:2]):
    text = ''.join(td.find(text=True))
    if index == 0:
      entry = "    { %3s" % text
    else:
      entry += ", \"%s\" }," % text.rstrip()
  # Required specially for "Dorsette's Inc." due to malformed html
  entry = entry.replace(u'\u0092', u'\'')
  # Required to convert accents/diaeresis etc.
  entry = entry.encode('translit/long')
  # Encode to ascii so we can out to file
  entry = entry.encode("ascii",'ignore')
  print entry

entry = "    { 0, NULL }\n};"
print entry.encode("ascii")