# *************************************************************************** # * * # * Copyright (c) 2018 Yorik van Havre * # * * # * This program is free software; you can redistribute it and/or modify * # * it under the terms of the GNU Lesser General Public License (LGPL) * # * as published by the Free Software Foundation; either version 2 of * # * the License, or (at your option) any later version. * # * for detail see the LICENCE text file. * # * * # * This program is distributed in the hope that it will be useful, * # * but WITHOUT ANY WARRANTY; without even the implied warranty of * # * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * # * GNU Library General Public License for more details. * # * * # * You should have received a copy of the GNU Library General Public * # * License along with this program; if not, write to the Free Software * # * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 * # * USA * # * * # *************************************************************************** """This script retrieves a list of standard property sets from the IFC4 official documentation website and stores them into a pset_dfinitions.xml files in the current directory. Warning, this can take a certain time (there are more than 400 definitions to retrieve)""" import codecs, os, re from urllib.request import urlopen MAXTRIES = 3 IFC_DOCS_ROOT_URL = "https://standards.buildingsmart.org/IFC/DEV/IFC4_2/FINAL/HTML/" # read the pset list print("Getting psets list...") u = urlopen( IFC_DOCS_ROOT_URL + "annex/annex-b/alphabeticalorder_psets.htm" ) p = u.read().decode('utf-8') u.close() psets = re.findall(r">Pset_(.*?)", p) # retrieve xml data from each Pset type psetdefs = "" failed = [] for i, pset in enumerate(psets): print(i + 1, "/", len(psets), ": Retrieving Pset", pset) for j in range(MAXTRIES): try: u = urlopen( IFC_DOCS_ROOT_URL + "psd/Pset_" + pset + ".xml" ) p = u.read().decode('utf-8') u.close() except: print(" Connection failed. trying one more time...") else: break else: print(" Unable to retrieve ", pset, ". Skipping...") failed.append(pset) psetdefs += p psetdefs = psetdefs.replace('', "") psetdefs = '\n\n' + psetdefs + "" f = codecs.open("pset_definitions.xml", "wb", "utf-8") f.write(psetdefs) f.close() print( "All done! writing " + os.path.join(os.path.abspath(os.curdir), "pset_definitions.xml") ) if failed: print("The following psets failed and were not retrieved:", failed)