Up our debugging game significantly by not making the rookie equals assignment object mistake
This commit is contained in:
parent
baee9b5087
commit
306b61055f
2 changed files with 35 additions and 14 deletions
|
@ -6,34 +6,52 @@ import sys
|
||||||
# Import our local settings management.
|
# Import our local settings management.
|
||||||
import settings
|
import settings
|
||||||
|
|
||||||
|
if not hasattr(sys, 'ps1'):
|
||||||
|
import copy
|
||||||
|
debug = True
|
||||||
|
else:
|
||||||
|
debug = False
|
||||||
|
|
||||||
# This works for one file:
|
# This works for one file:
|
||||||
# timelog = pd.read_csv(settings.pomodoro_logfile())
|
timelog = pd.read_csv(settings.pomodoro_logfile())
|
||||||
|
|
||||||
# For multiple files:
|
# For multiple files:
|
||||||
path = settings.pomodoro_logpath()
|
#path = settings.pomodoro_logpath()
|
||||||
all_files = glob.glob(path + "*.csv")
|
#all_files = glob.glob(path + "*.csv")
|
||||||
|
#
|
||||||
|
#li = []
|
||||||
|
#
|
||||||
|
#for filename in all_files:
|
||||||
|
# df = pd.read_csv(filename, index_col=None, header=0)
|
||||||
|
# li.append(df)
|
||||||
|
|
||||||
li = []
|
# timelog = pd.concat(li, axis=0, ignore_index=True)
|
||||||
|
|
||||||
for filename in all_files:
|
if debug:
|
||||||
df = pd.read_csv(filename, index_col=None, header=0)
|
imported = copy.deepcopy(timelog)
|
||||||
li.append(df)
|
|
||||||
|
|
||||||
timelog = pd.concat(li, axis=0, ignore_index=True)
|
|
||||||
|
|
||||||
timelog.drop_duplicates(inplace=True)
|
timelog.drop_duplicates(inplace=True)
|
||||||
|
|
||||||
|
if debug:
|
||||||
|
nodupes = copy.deepcopy(timelog)
|
||||||
|
|
||||||
# Dump bad data. The real solution here is to get rid of the damned 'Cancel'
|
# Dump bad data. The real solution here is to get rid of the damned 'Cancel'
|
||||||
# button on the Pomodoro Prompt dialog, but i don't know how to do that, so we
|
# button on the Pomodoro Prompt dialog, but i don't know how to do that, so we
|
||||||
# need to drop the rows where the work task description is blank, which is
|
# need to drop the rows where the work task description is blank, which is
|
||||||
# coming in as not a number for reasons i'm not entirely clear on. Maybe
|
# coming in as not a number for reasons i'm not entirely clear on. Maybe
|
||||||
# because it's the last row of the spreadsheet? Anyway we cannot do anything
|
# because it's the last row of the spreadsheet? Anyway we cannot do anything
|
||||||
# with no data in the description, so drop them at the outset.
|
# with no data in the description, so drop them at the outset.
|
||||||
timelog = timelog.dropna()
|
# We can allow no data in the 'intention' so define the three columns to check:
|
||||||
|
timelog = timelog.dropna(subset=['started', 'recorded', 'description'])
|
||||||
timelog = timelog.reset_index(drop=True)
|
timelog = timelog.reset_index(drop=True)
|
||||||
|
|
||||||
# For debugging, keep original description around.
|
if debug:
|
||||||
timelog["orig_desc"] = timelog["description"]
|
dropna = copy.deepcopy(timelog)
|
||||||
|
|
||||||
|
# For debugging, keep originals around.
|
||||||
|
timelog["orig_desc"] = timelog["description"]
|
||||||
|
timelog["orig_started"] = timelog["started"]
|
||||||
|
timelog["orig_recorded"] = timelog["recorded"]
|
||||||
|
|
||||||
# Clean up description before we go to work on it.
|
# Clean up description before we go to work on it.
|
||||||
timelog['description'] = timelog['description'].str.strip()
|
timelog['description'] = timelog['description'].str.strip()
|
||||||
|
@ -44,6 +62,9 @@ timelog['description'] = timelog['description'].str.strip()
|
||||||
timelog["description"] = list(timelog["description"].str.split(";"))
|
timelog["description"] = list(timelog["description"].str.split(";"))
|
||||||
timelog = timelog.explode("description").reset_index()
|
timelog = timelog.explode("description").reset_index()
|
||||||
|
|
||||||
|
if debug:
|
||||||
|
mess = copy.deepcopy(timelog)
|
||||||
|
|
||||||
timelog["started"] = pd.to_datetime(timelog["started"]).dt.tz_convert("US/Eastern")
|
timelog["started"] = pd.to_datetime(timelog["started"]).dt.tz_convert("US/Eastern")
|
||||||
timelog["recorded"] = pd.to_datetime(timelog["recorded"]).dt.tz_convert("US/Eastern")
|
timelog["recorded"] = pd.to_datetime(timelog["recorded"]).dt.tz_convert("US/Eastern")
|
||||||
|
|
||||||
|
@ -112,7 +133,7 @@ for preferred, alternatives in replacement_project_names.items():
|
||||||
# The fillna is essential or we drop entries with blank ('None') projects.
|
# The fillna is essential or we drop entries with blank ('None') projects.
|
||||||
tl = timelog.groupby(["date", timelog.project.fillna(""), "description"]).agg({"time": 'sum', "started": 'min', "recorded": 'max'}).reset_index()
|
tl = timelog.groupby(["date", timelog.project.fillna(""), "description"]).agg({"time": 'sum', "started": 'min', "recorded": 'max'}).reset_index()
|
||||||
|
|
||||||
if not hasattr(sys, 'ps1'):
|
if debug:
|
||||||
tl.to_csv('harvest-ready.csv', index=False)
|
tl.to_csv('harvest-ready.csv', index=False)
|
||||||
settings.pomodoro_latest_recorded(tl.recorded.max())
|
settings.pomodoro_latest_recorded(tl.recorded.max())
|
||||||
else:
|
else:
|
||||||
|
|
|
@ -14,7 +14,7 @@ def write():
|
||||||
|
|
||||||
if not os.path.isfile('settings.ini'):
|
if not os.path.isfile('settings.ini'):
|
||||||
# Set some essential initial values.
|
# Set some essential initial values.
|
||||||
# pomodoro['logfile'] = '~/Projects/agaric/python/pomodoroprompt/log/2021.csv'
|
pomodoro['logfile'] = '~/Projects/agaric/python/pomodoroprompt/log/timelog.csv'
|
||||||
# This path must be absolute, for some reason using ~ for home isn t wor::
|
# This path must be absolute, for some reason using ~ for home isn t wor::
|
||||||
pomodoro['logpath'] = '/home/mlncn/Projects/agaric/python/pomodoroprompt/log/'
|
pomodoro['logpath'] = '/home/mlncn/Projects/agaric/python/pomodoroprompt/log/'
|
||||||
write()
|
write()
|
||||||
|
|
Loading…
Reference in a new issue