""" # Total visited links visited = [] # Total working links found urls = [] resources = [] # Create excel file # wb = Workbook() # filename = input("Enter a title for the excel file: ") url = input("Enter url to crawl: ") resource = Resource(url) resource.get_resource_data() resource_values = { "title": resource.title, "url": resource.link, "link status": resource.status, "resource types": resource.resource_type, "disciplines": resource.themes, "organization": resource.get_org(), "organization validated in VIAF": resource.org.validated, "VIAF uri": resource.org.uri, "contact organization": resource.resource_contact_org, "contact name": resource.resource_contact_person_name, "contact email": resource.resource_contact_email, "contact phone": resource.resource_contact_phone, }
Program begins. """ # Total visited links visited = [] # Total working links found urls = [] resources = [] # Create excel file # wb = Workbook() # filename = input("Enter a title for the excel file: ") url = input("Enter url to crawl: ") resource = Resource(url) resource.get_resource_data() resource_values = { 'title': resource.title, 'url': resource.link, 'link status': resource.status, #'resource types': resource.resource_type, 'disciplines': resource.themes, 'organization': resource.get_org(), 'organization validated in VIAF': resource.org.validated, 'VIAF uri': resource.org.uri, 'contact organization': resource.resource_contact_org, 'contact name': resource.resource_contact_person_name, 'contact email': resource.resource_contact_email, 'contact phone': resource.resource_contact_phone } fieldnames = [