import os, sys from datetime import datetime from dateutil import relativedelta sys.path.append('/var/www/digisnaxx.ado/scrapers') import dtss dtss.getReady() from time import sleep from pprint import pprint as ppr import pytz from events.models import Organization, Scraper import events.digitools as digitools count = 0 tz = pytz.timezone("US/Central") DATETIME_FORMAT = '%a, %b %d %Y %I%p' DATETIME_FORMAT_2 = '%a, %b %d %Y %I:%M %p SHOW' venue, created = Organization.objects.get_or_create( name="Icehouse", city="Minneapolis", website = "https://icehouse.turntabletickets.com", is_venue = True ) scraper,item_count_start,virtcal = digitools.getScraper(venue, venue.website, 'msp') def get_events(ps, event_type): contents = ps.xpath('.//*/div[@class="performances whitespace-pre-line w-full md:w-3/4"]') for c in contents: try: event = {} event['scraper'] = scraper event['calendars'] = scraper.calendar event['title'] = c.xpath('.//*/h3[@class="text-3xl font-semibold font-heading mr-auto"]/text()')[0] event['link'] = venue.website + c.xpath('.//*/a[@class="show-link"]/@href')[0] event['date'] = c.xpath('.//*/h4[@class="day-of-week"]/text()')[0] month = event['date'].split(' ')[1].strip() print("MONTH: ", month) year = int(datetime.today().year) if month in ['Jan', 'Feb', 'Mar']: year = year + 1 time = c.xpath('.//p/span/text()')[0][:4].strip() if time[-1:] == 'm': event['dateStamp'] = event['date'] + ' ' + str(year) + ' ' + time event['dateStamp'] =datetime.strptime(event['dateStamp'], DATETIME_FORMAT) digitools.createBasicEvent(event, event_type, venue) else: ppr(event) print("MONTH: ", month) except Exception as e: print("What?",e,"\n\n+++") if len(sys.argv) >= 2: arg1 = sys.argv[1] br = digitools.getBrowser(arg1) else: print("No run_env") quit() ps = digitools.getSource(br, venue.website) br.execute_script("window.scrollTo(0, window.scrollY + 5000)") get_events(ps, "Mu") # ppr(events) br.close() digitools.updateScraper(scraper, item_count_start)