„ical2csv.py“ ändern
Migrate https://github.com/erikcox/ical2csv/pull/13
This commit is contained in:
parent
cb2bc45191
commit
84b4b8b843
100
ical2csv.py
100
ical2csv.py
@ -3,8 +3,24 @@
|
||||
import sys
|
||||
import os.path
|
||||
from icalendar import Calendar
|
||||
import recurring_ical_events
|
||||
from bs4 import BeautifulSoup
|
||||
import warnings
|
||||
from dateutil.parser import parse
|
||||
import datetime
|
||||
import csv
|
||||
|
||||
warnings.filterwarnings("ignore", category=UserWarning, module='bs4') # We don't want warnings about URL's. We just what the URL printed, if there.
|
||||
|
||||
if len(sys.argv) <= 1:
|
||||
print("Please call this script with an ics-file as parameter.\n")
|
||||
print("Even better, call it with start and end dates:\n")
|
||||
print(sys.argv[0] + " myexport.ics 20210101 20210201")
|
||||
print(sys.argv[0] + " myexport.ics 2021-01-01T00:00:00 2021-01-31T23:59:59\n")
|
||||
print("NOTE: If you need data in another timezone than the system is set to, override like this before running the script:")
|
||||
print("export TZ=\"Europe/Copenhagen\"\n")
|
||||
exit(1)
|
||||
|
||||
filename = sys.argv[1]
|
||||
# TODO: use regex to get file extension (chars after last period), in case it's not exactly 3 chars.
|
||||
file_extension = str(sys.argv[1])[-3:]
|
||||
@ -25,6 +41,24 @@ class CalendarEvent:
|
||||
|
||||
events = []
|
||||
|
||||
def removehtml(html):
|
||||
# Almost word for word copy from here: https://stackoverflow.com/questions/328356/extracting-text-from-html-file-using-python
|
||||
|
||||
soup = BeautifulSoup(html, features="html.parser")
|
||||
# kill all script and style elements
|
||||
for script in soup(["script", "style"]):
|
||||
script.extract() # remove it
|
||||
|
||||
text = soup.get_text() # Get plain text
|
||||
|
||||
# break into lines and remove leading and trailing space on each
|
||||
lines = (line.strip() for line in text.splitlines())
|
||||
# break multi-headlines into a line each
|
||||
chunks = (phrase.strip() for line in lines for phrase in line.split(" "))
|
||||
# drop blank lines
|
||||
text = '\n'.join(chunk for chunk in chunks if chunk)
|
||||
|
||||
return text
|
||||
|
||||
def open_cal():
|
||||
if os.path.isfile(filename):
|
||||
@ -32,24 +66,33 @@ def open_cal():
|
||||
print("Extracting events from file:", filename, "\n")
|
||||
f = open(sys.argv[1], 'rb')
|
||||
gcal = Calendar.from_ical(f.read())
|
||||
revents = recurring_ical_events.of(gcal).between(istart,istop)
|
||||
|
||||
for component in gcal.walk():
|
||||
# for component in gcal.walk():
|
||||
for component in revents:
|
||||
event = CalendarEvent("event")
|
||||
if component.get('TRANSP') == 'TRANSPARENT': continue #skip event that have not been accepted
|
||||
if component.get('SUMMARY') == None: continue #skip blank items
|
||||
event.summary = component.get('SUMMARY')
|
||||
event.uid = component.get('UID')
|
||||
if component.get('DESCRIPTION') == None: continue #skip blank items
|
||||
event.description = component.get('DESCRIPTION')
|
||||
event.location = component.get('LOCATION')
|
||||
if hasattr(component.get('dtstart'), 'dt'):
|
||||
event.start = component.get('dtstart').dt
|
||||
if hasattr(component.get('dtend'), 'dt'):
|
||||
event.end = component.get('dtend').dt
|
||||
v=(dir(component).count('get')) # Only proces data if object is a valid event
|
||||
if (v != 0):
|
||||
if component.get('TRANSP') == 'TRANSPARENT': continue #skip all day events and the like
|
||||
if component.get('SUMMARY') == None: continue #skip blank items
|
||||
event.summary = component.get('SUMMARY')
|
||||
event.uid = component.get('UID')
|
||||
if component.get('DESCRIPTION') == None: continue #skip blank items
|
||||
event.description = component.get('DESCRIPTION')
|
||||
event.location = component.get('LOCATION')
|
||||
if hasattr(component.get('dtstart'), 'dt'):
|
||||
event.start = component.get('dtstart').dt
|
||||
if hasattr(component.get('dtend'), 'dt'):
|
||||
event.end = component.get('dtend').dt
|
||||
|
||||
|
||||
event.url = component.get('URL')
|
||||
events.append(event)
|
||||
if type(now) != type(event.start): # If we get a datetime.date object, convert to datetime.datetime
|
||||
event.start=datetime.datetime.combine(event.start, datetime.time.min)
|
||||
if type(now) != type(event.end): # If we get a datetime.date object, convert to datetime.datetime
|
||||
event.end=datetime.datetime.combine(event.end, datetime.time.max)
|
||||
event.start = event.start.astimezone()
|
||||
event.end = event.end.astimezone()
|
||||
event.url = component.get('URL')
|
||||
events.append(event)
|
||||
f.close()
|
||||
else:
|
||||
print("You entered ", filename, ". ")
|
||||
@ -63,14 +106,21 @@ def open_cal():
|
||||
|
||||
def csv_write(icsfile):
|
||||
csvfile = icsfile[:-3] + "csv"
|
||||
spent=0
|
||||
evcount=0
|
||||
evskip=0
|
||||
sys.stdout.write("Processing events : ")
|
||||
try:
|
||||
with open(csvfile, 'w') as myfile:
|
||||
wr = csv.writer(myfile, quoting=csv.QUOTE_ALL)
|
||||
wr.writerow(headers)
|
||||
for event in sortedevents:
|
||||
values = (event.summary.encode('utf8').decode(), event.uid, event.description.encode('utf8').decode(), event.location, event.start, event.end, event.url)
|
||||
values = (event.summary.encode('utf-8').decode(), event.uid, removehtml(event.description.encode('utf-8').decode()), event.location.encode('utf-8').decode(), event.start, event.end, event.url)
|
||||
wr.writerow(values)
|
||||
print("Wrote to ", csvfile, "\n")
|
||||
sys.stdout.write(".")
|
||||
sys.stdout.flush()
|
||||
evcount+=1
|
||||
print("\n\nWrote " + str(evcount) + " events to ", csvfile, "\n")
|
||||
except IOError:
|
||||
print("Could not open file! Please close Excel!")
|
||||
exit(0)
|
||||
@ -86,7 +136,19 @@ def debug_event(class_name):
|
||||
print(class_name.end)
|
||||
print(class_name.url, "\n")
|
||||
|
||||
open_cal()
|
||||
sortedevents=sorted(events, key=lambda obj: obj.start) # Needed to sort events. They are not fully chronological in a Google Calendard export ...
|
||||
now=datetime.datetime.now()
|
||||
istart=datetime.datetime.fromtimestamp(0) # Start of UNIX epoch (1970-01-01T00:00:00)
|
||||
istop=now+datetime.timedelta(seconds=157680000) # Stop 5 years in the future, if no enddate is given, to make sure reucurring events don't go on forever ...
|
||||
|
||||
if len(sys.argv) > 3:
|
||||
if sys.argv[2] != '':
|
||||
istart=parse(sys.argv[2])
|
||||
if sys.argv[3] != '':
|
||||
istop=parse(sys.argv[3])
|
||||
|
||||
print("Opening ics file\n")
|
||||
open_cal() # Open ics file and do initial parsing of events
|
||||
print("Sorting events\n")
|
||||
sortedevents=sorted(events, key=lambda obj: obj.start) # Make sure events are in chronological order
|
||||
csv_write(filename)
|
||||
#debug_event(event)
|
||||
|
Loading…
Reference in New Issue
Block a user