Compare commits
30 Commits
nilmdb-2.0
...
master
Author | SHA1 | Date | |
---|---|---|---|
517b237636 | |||
07f138e0f4 | |||
7538c6201b | |||
4d9a106ca1 | |||
e90a79ddad | |||
7056c5b4ec | |||
df4e7f0967 | |||
b6bba16505 | |||
d4003d0d34 | |||
759492298a | |||
b5f6fcc253 | |||
905e325ded | |||
648b6f4b70 | |||
7f8a2c7027 | |||
276fbc652a | |||
10b34f5937 | |||
83daeb148a | |||
d65f00e8b2 | |||
71dc01c9a7 | |||
bcd21b3498 | |||
a1dee0e6f2 | |||
99ac47cf0d | |||
4cdaef51c1 | |||
88466dcafe | |||
8dfb8da15c | |||
6cc1f6b7b2 | |||
8dc36c2d37 | |||
3738430103 | |||
a41111b045 | |||
85f822e1c4 |
|
@ -1,7 +1,7 @@
|
|||
# nilmdb: Non-Intrusive Load Monitor Database
|
||||
by Jim Paris <jim@jtan.com>
|
||||
|
||||
NilmDB requires Python 3.7 or newer.
|
||||
NilmDB requires Python 3.8 or newer.
|
||||
|
||||
## Prerequisites:
|
||||
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
#!/usr/bin/python
|
||||
#!/usr/bin/env python3
|
||||
|
||||
import os
|
||||
import sys
|
||||
|
|
|
@ -145,8 +145,8 @@ class Client():
|
|||
|
||||
Example:
|
||||
with client.stream_insert_context('/path', start, end) as ctx:
|
||||
ctx.insert('1234567890.0 1 2 3 4\\n')
|
||||
ctx.insert('1234567891.0 1 2 3 4\\n')
|
||||
ctx.insert('1234567890000000 1 2 3 4\\n')
|
||||
ctx.insert('1234567891000000 1 2 3 4\\n')
|
||||
|
||||
For more details, see help for nilmdb.client.client.StreamInserter
|
||||
|
||||
|
|
|
@ -109,7 +109,7 @@ class HTTPClient():
|
|||
stream=False, headers=headers)
|
||||
if isjson:
|
||||
return json.loads(response.content)
|
||||
return response.content
|
||||
return response.text
|
||||
|
||||
def get(self, url, params=None):
|
||||
"""Simple GET (parameters in URL)"""
|
||||
|
|
|
@ -59,7 +59,7 @@ class NumpyClient(nilmdb.client.client.Client):
|
|||
dtype = self._get_dtype(path, layout)
|
||||
|
||||
def to_numpy(data):
|
||||
a = numpy.fromstring(data, dtype)
|
||||
a = numpy.frombuffer(data, dtype)
|
||||
if structured:
|
||||
return a
|
||||
return numpy.c_[a['timestamp'], a['data']]
|
||||
|
|
|
@ -66,7 +66,7 @@ class Complete():
|
|||
layouts = []
|
||||
for i in range(1, 10):
|
||||
layouts.extend([(t + "_" + str(i)) for t in types])
|
||||
return (l for l in layouts if l.startswith(prefix))
|
||||
return (lay for lay in layouts if lay.startswith(prefix))
|
||||
|
||||
def meta_key(self, prefix, parsed_args, **kwargs):
|
||||
return (kv.split('=')[0] for kv
|
||||
|
|
|
@ -1,7 +1,5 @@
|
|||
# -*- coding: utf-8 -*-
|
||||
|
||||
raise Exception("todo: fix path bytes issues")
|
||||
|
||||
"""Check database consistency, with some ability to fix problems.
|
||||
This should be able to fix cases where a database gets corrupted due
|
||||
to unexpected system shutdown, and detect other cases that may cause
|
||||
|
@ -13,7 +11,6 @@ import nilmdb.client.numpyclient
|
|||
from nilmdb.utils.interval import IntervalError
|
||||
from nilmdb.server.interval import Interval, IntervalSet
|
||||
from nilmdb.utils.printf import printf, fprintf, sprintf
|
||||
from nilmdb.utils.time import timestamp_to_string
|
||||
|
||||
from collections import defaultdict
|
||||
import sqlite3
|
||||
|
@ -21,44 +18,55 @@ import os
|
|||
import sys
|
||||
import progressbar
|
||||
import re
|
||||
import time
|
||||
import shutil
|
||||
import pickle
|
||||
import numpy
|
||||
|
||||
|
||||
class FsckError(Exception):
|
||||
def __init__(self, msg="", *args):
|
||||
if args:
|
||||
msg = sprintf(msg, *args)
|
||||
Exception.__init__(self, msg)
|
||||
|
||||
|
||||
class FixableFsckError(FsckError):
|
||||
def __init__(self, msg = "", *args):
|
||||
if args:
|
||||
msg = sprintf(msg, *args)
|
||||
FsckError.__init__(self, "%s\nThis may be fixable with \"--fix\".", msg)
|
||||
def __init__(self, msg=""):
|
||||
FsckError.__init__(self, f'{msg}\nThis may be fixable with "--fix".')
|
||||
|
||||
|
||||
class RetryFsck(FsckError):
|
||||
pass
|
||||
|
||||
|
||||
class FsckFormatError(FsckError):
|
||||
pass
|
||||
|
||||
|
||||
def log(format, *args):
|
||||
printf(format, *args)
|
||||
|
||||
|
||||
def err(format, *args):
|
||||
fprintf(sys.stderr, format, *args)
|
||||
|
||||
|
||||
# Decorator that retries a function if it returns a specific value
|
||||
def retry_if_raised(exc, message = None, max_retries = 100):
|
||||
def retry_if_raised(exc, message=None, max_retries=1000):
|
||||
def f1(func):
|
||||
def f2(*args, **kwargs):
|
||||
for n in range(max_retries):
|
||||
try:
|
||||
return func(*args, **kwargs)
|
||||
except exc as e:
|
||||
except exc:
|
||||
if message:
|
||||
log("%s\n\n", message)
|
||||
raise Exception("Max number of retries (%d) exceeded; giving up")
|
||||
log(f"{message} ({n+1})\n\n")
|
||||
raise Exception("Max number of retries (%d) exceeded; giving up" %
|
||||
max_retries)
|
||||
return f2
|
||||
return f1
|
||||
|
||||
|
||||
class Progress(object):
|
||||
def __init__(self, maxval):
|
||||
if maxval == 0:
|
||||
|
@ -68,22 +76,24 @@ class Progress(object):
|
|||
widgets=[progressbar.Percentage(), ' ',
|
||||
progressbar.Bar(), ' ',
|
||||
progressbar.ETA()])
|
||||
if self.bar.term_width == 0:
|
||||
self.bar.term_width = 75
|
||||
self.bar.term_width = self.bar.term_width or 75
|
||||
|
||||
def __enter__(self):
|
||||
self.bar.start()
|
||||
self.last_update = 0
|
||||
return self
|
||||
|
||||
def __exit__(self, exc_type, exc_value, traceback):
|
||||
if exc_type is None:
|
||||
self.bar.finish()
|
||||
else:
|
||||
printf("\n")
|
||||
|
||||
def update(self, val):
|
||||
self.bar.update(val)
|
||||
|
||||
class Fsck(object):
|
||||
|
||||
class Fsck(object):
|
||||
def __init__(self, path, fix=False):
|
||||
self.basepath = path
|
||||
self.sqlpath = os.path.join(path, "data.sql")
|
||||
|
@ -109,7 +119,9 @@ class Fsck(object):
|
|||
finally:
|
||||
if self.bulk:
|
||||
self.bulk.close()
|
||||
if self.sql:
|
||||
if self.sql: # pragma: no cover
|
||||
# (coverage doesn't handle finally clauses correctly;
|
||||
# both branches here are tested)
|
||||
self.sql.commit()
|
||||
self.sql.close()
|
||||
log("ok\n")
|
||||
|
@ -164,7 +176,7 @@ class Fsck(object):
|
|||
"ORDER BY start_time")
|
||||
for r in result:
|
||||
if r[0] not in self.stream_path:
|
||||
raise FsckError("interval ID %d not in streams", k)
|
||||
raise FsckError("interval ID %d not in streams", r[0])
|
||||
self.stream_interval[r[0]].append((r[1], r[2], r[3], r[4]))
|
||||
|
||||
log(" loading metadata\n")
|
||||
|
@ -172,9 +184,10 @@ class Fsck(object):
|
|||
result = cur.execute("SELECT stream_id, key, value FROM metadata")
|
||||
for r in result:
|
||||
if r[0] not in self.stream_path:
|
||||
raise FsckError("metadata ID %d not in streams", k)
|
||||
raise FsckError("metadata ID %d not in streams", r[0])
|
||||
if r[1] in self.stream_meta[r[0]]:
|
||||
raise FsckError("duplicate metadata key '%s' for stream %d",
|
||||
raise FsckError(
|
||||
"duplicate metadata key '%s' for stream %d",
|
||||
r[1], r[0])
|
||||
self.stream_meta[r[0]][r[1]] = r[2]
|
||||
|
||||
|
@ -202,6 +215,7 @@ class Fsck(object):
|
|||
|
||||
# must exist in bulkdata
|
||||
bulk = self.bulkpath + path
|
||||
bulk = bulk.encode('utf-8')
|
||||
if not os.path.isdir(bulk):
|
||||
raise FsckError("%s: missing bulkdata dir", path)
|
||||
if not nilmdb.server.bulkdata.Table.exists(bulk):
|
||||
|
@ -224,39 +238,97 @@ class Fsck(object):
|
|||
try:
|
||||
posiset += new
|
||||
except IntervalError:
|
||||
raise FsckError("%s: overlap in file offsets:\n"
|
||||
"set: %s\nnew: %s",
|
||||
path, str(posiset), str(new))
|
||||
self.fix_row_overlap(sid, path, posiset, new)
|
||||
|
||||
# check bulkdata
|
||||
try:
|
||||
# Check bulkdata
|
||||
self.check_bulkdata(sid, path, bulk)
|
||||
|
||||
# Check that we can open bulkdata
|
||||
try:
|
||||
tab = None
|
||||
try:
|
||||
tab = nilmdb.server.bulkdata.Table(bulk)
|
||||
except Exception as e:
|
||||
except FsckFormatError:
|
||||
# If there are no files except _format, try deleting
|
||||
# the entire stream; this may remove metadata, but
|
||||
# it's probably unimportant.
|
||||
files = list(os.listdir(bulk))
|
||||
if len(files) > 1:
|
||||
raise FsckFormatError(f"{path}: can't load _format, "
|
||||
f"but data is also present")
|
||||
|
||||
# Since the stream was empty, just remove it
|
||||
self.fix_remove_stream(sid, path, bulk,
|
||||
"empty, with corrupted format file")
|
||||
except FsckError as e:
|
||||
raise e
|
||||
except Exception as e: # pragma: no cover
|
||||
# No coverage because this is an unknown/unexpected error
|
||||
raise FsckError("%s: can't open bulkdata: %s",
|
||||
path, str(e))
|
||||
finally:
|
||||
if tab:
|
||||
tab.close()
|
||||
|
||||
def fix_row_overlap(self, sid, path, existing, new):
|
||||
# If the file rows (spos, epos) overlap in the interval table,
|
||||
# and the overlapping ranges look like this:
|
||||
# A --------- C
|
||||
# B -------- D
|
||||
# Then we can try changing the first interval to go from
|
||||
# A to B instead.
|
||||
msg = (f"{path}: overlap in file offsets:\n"
|
||||
f"existing ranges: {existing}\n"
|
||||
f"overlapping interval: {new}")
|
||||
if not self.fix:
|
||||
raise FixableFsckError(msg)
|
||||
err(f"\n{msg}\nSeeing if we can truncate one of them...\n")
|
||||
|
||||
# See if there'e exactly one interval that overlaps the
|
||||
# conflicting one in the right way
|
||||
match = None
|
||||
for intv in self.stream_interval[sid]:
|
||||
(stime, etime, spos, epos) = intv
|
||||
if spos < new.start and epos > new.start:
|
||||
if match:
|
||||
err(f"no, more than one interval matched:\n"
|
||||
f"{intv}\n{match}\n")
|
||||
raise FsckError(f"{path}: unfixable overlap")
|
||||
match = intv
|
||||
if match is None:
|
||||
err("no intervals overlapped in the right way\n")
|
||||
raise FsckError(f"{path}: unfixable overlap")
|
||||
|
||||
# Truncate the file position
|
||||
err(f"truncating {match}\n")
|
||||
with self.sql:
|
||||
cur = self.sql.cursor()
|
||||
cur.execute("UPDATE ranges SET end_pos=? "
|
||||
"WHERE stream_id=? AND start_time=? AND "
|
||||
"end_time=? AND start_pos=? AND end_pos=?",
|
||||
(new.start, sid, *match))
|
||||
if cur.rowcount != 1: # pragma: no cover (shouldn't fail)
|
||||
raise FsckError("failed to fix SQL database")
|
||||
raise RetryFsck
|
||||
|
||||
### Check that bulkdata is good enough to be opened
|
||||
|
||||
@retry_if_raised(RetryFsck)
|
||||
def check_bulkdata(self, sid, path, bulk):
|
||||
with open(os.path.join(bulk, "_format"), "rb") as f:
|
||||
try:
|
||||
with open(os.path.join(bulk, b"_format"), "rb") as f:
|
||||
fmt = pickle.load(f)
|
||||
except Exception as e:
|
||||
raise FsckFormatError(f"{path}: can't load _format file ({e})")
|
||||
|
||||
if fmt["version"] != 3:
|
||||
raise FsckError("%s: bad or unsupported bulkdata version %d",
|
||||
raise FsckFormatError("%s: bad or unsupported bulkdata version %d",
|
||||
path, fmt["version"])
|
||||
row_per_file = int(fmt["rows_per_file"])
|
||||
rows_per_file = int(fmt["rows_per_file"])
|
||||
if rows_per_file < 1:
|
||||
raise FsckFormatError(f"{path}: bad rows_per_file {rows_per_file}")
|
||||
files_per_dir = int(fmt["files_per_dir"])
|
||||
if files_per_dir < 1:
|
||||
raise FsckFormatError(f"{path}: bad files_per_dir {files_per_dir}")
|
||||
layout = fmt["layout"]
|
||||
if layout != self.stream_layout[sid]:
|
||||
raise FsckError("%s: layout mismatch %s != %s", path,
|
||||
raise FsckFormatError("%s: layout mismatch %s != %s", path,
|
||||
layout, self.stream_layout[sid])
|
||||
|
||||
# Every file should have a size that's the multiple of the row size
|
||||
|
@ -265,7 +337,7 @@ class Fsck(object):
|
|||
rkt.close()
|
||||
|
||||
# Find all directories
|
||||
regex = re.compile("^[0-9a-f]{4,}$")
|
||||
regex = re.compile(b"^[0-9a-f]{4,}$")
|
||||
subdirs = sorted(filter(regex.search, os.listdir(bulk)),
|
||||
key=lambda x: int(x, 16), reverse=True)
|
||||
for subdir in subdirs:
|
||||
|
@ -274,7 +346,7 @@ class Fsck(object):
|
|||
files = list(filter(regex.search, os.listdir(subpath)))
|
||||
if not files:
|
||||
self.fix_empty_subdir(subpath)
|
||||
raise RetryFsck
|
||||
|
||||
# Verify that their size is a multiple of the row size
|
||||
for filename in files:
|
||||
filepath = os.path.join(subpath, filename)
|
||||
|
@ -290,10 +362,11 @@ class Fsck(object):
|
|||
# as long as it's only ".removed" files.
|
||||
err("\n%s\n", msg)
|
||||
for fn in os.listdir(subpath):
|
||||
if not fn.endswith(".removed"):
|
||||
if not fn.endswith(b".removed"):
|
||||
raise FsckError("can't fix automatically: please manually "
|
||||
"remove the file %s and try again",
|
||||
os.path.join(subpath, fn))
|
||||
"remove the file '%s' and try again",
|
||||
os.path.join(subpath, fn).decode(
|
||||
'utf-8', errors='backslashreplace'))
|
||||
# Remove the whole thing
|
||||
err("Removing empty subpath\n")
|
||||
shutil.rmtree(subpath)
|
||||
|
@ -314,6 +387,24 @@ class Fsck(object):
|
|||
f.truncate(newsize)
|
||||
raise RetryFsck
|
||||
|
||||
def fix_remove_stream(self, sid, path, bulk, reason):
|
||||
msg = f"stream {path} is corrupted: {reason}"
|
||||
if not self.fix:
|
||||
raise FixableFsckError(msg)
|
||||
# Remove the stream from disk and the database
|
||||
err(f"\n{msg}\n")
|
||||
err(f"Removing stream {path} from disk and database\n")
|
||||
shutil.rmtree(bulk)
|
||||
with self.sql:
|
||||
cur = self.sql.cursor()
|
||||
cur.execute("DELETE FROM streams WHERE id=?",
|
||||
(sid,))
|
||||
if cur.rowcount != 1: # pragma: no cover (shouldn't fail)
|
||||
raise FsckError("failed to remove stream")
|
||||
cur.execute("DELETE FROM ranges WHERE stream_id=?", (sid,))
|
||||
cur.execute("DELETE FROM metadata WHERE stream_id=?", (sid,))
|
||||
raise RetryFsck
|
||||
|
||||
### Check interval endpoints
|
||||
|
||||
def check_intervals(self):
|
||||
|
@ -324,9 +415,12 @@ class Fsck(object):
|
|||
for sid in self.stream_interval:
|
||||
try:
|
||||
bulk = self.bulkpath + self.stream_path[sid]
|
||||
bulk = bulk.encode('utf-8')
|
||||
tab = nilmdb.server.bulkdata.Table(bulk)
|
||||
|
||||
def update(x):
|
||||
pbar.update(done + x)
|
||||
|
||||
ints = self.stream_interval[sid]
|
||||
done += self.check_table_intervals(sid, ints, tab, update)
|
||||
finally:
|
||||
|
@ -335,7 +429,7 @@ class Fsck(object):
|
|||
def check_table_intervals(self, sid, ints, tab, update):
|
||||
# look in the table to make sure we can pick out the interval's
|
||||
# endpoints
|
||||
path = self.stream_path[sid]
|
||||
path = self.stream_path[sid] # noqa: F841 unused
|
||||
tab.file_open.cache_remove_all()
|
||||
for (i, intv) in enumerate(ints):
|
||||
update(i)
|
||||
|
@ -343,11 +437,11 @@ class Fsck(object):
|
|||
if spos == epos and spos >= 0 and spos <= tab.nrows:
|
||||
continue
|
||||
try:
|
||||
srow = tab[spos]
|
||||
erow = tab[epos-1]
|
||||
srow = tab[spos] # noqa: F841 unused
|
||||
erow = tab[epos-1] # noqa: F841 unused
|
||||
except Exception as e:
|
||||
self.fix_bad_interval(sid, intv, tab, str(e))
|
||||
raise RetryFsck
|
||||
|
||||
return len(ints)
|
||||
|
||||
def fix_bad_interval(self, sid, intv, tab, msg):
|
||||
|
@ -376,23 +470,23 @@ class Fsck(object):
|
|||
"end_time=? AND start_pos=? AND end_pos=?",
|
||||
(new_etime, new_epos, sid, stime, etime,
|
||||
spos, epos))
|
||||
if cur.rowcount != 1:
|
||||
if cur.rowcount != 1: # pragma: no cover (shouldn't fail)
|
||||
raise FsckError("failed to fix SQL database")
|
||||
raise RetryFsck
|
||||
err("actually it can't be truncated; times are bad too")
|
||||
err("actually it can't be truncated; times are bad too\n")
|
||||
|
||||
# Otherwise, the only hope is to delete the interval entirely.
|
||||
err("*** Deleting the entire interval from SQL.\n")
|
||||
err("This may leave stale data on disk. To fix that, copy all\n")
|
||||
err("data from this stream to a new stream, then remove all data\n")
|
||||
err("from and destroy %s.\n", path)
|
||||
err("This may leave stale data on disk. To fix that, copy all "
|
||||
"data from this stream to a new stream using nilm-copy, then\n")
|
||||
err("remove all data from and destroy %s.\n", path)
|
||||
with self.sql:
|
||||
cur = self.sql.cursor()
|
||||
cur.execute("DELETE FROM ranges WHERE "
|
||||
"stream_id=? AND start_time=? AND "
|
||||
"end_time=? AND start_pos=? AND end_pos=?",
|
||||
(sid, stime, etime, spos, epos))
|
||||
if cur.rowcount != 1:
|
||||
if cur.rowcount != 1: # pragma: no cover (shouldn't fail)
|
||||
raise FsckError("failed to remove interval")
|
||||
raise RetryFsck
|
||||
|
||||
|
@ -407,9 +501,12 @@ class Fsck(object):
|
|||
for sid in self.stream_interval:
|
||||
try:
|
||||
bulk = self.bulkpath + self.stream_path[sid]
|
||||
bulk = bulk.encode('utf-8')
|
||||
tab = nilmdb.server.bulkdata.Table(bulk)
|
||||
|
||||
def update(x):
|
||||
pbar.update(done + x)
|
||||
|
||||
ints = self.stream_interval[sid]
|
||||
done += self.check_table_data(sid, ints, tab, update)
|
||||
finally:
|
||||
|
@ -418,7 +515,7 @@ class Fsck(object):
|
|||
def check_table_data(self, sid, ints, tab, update):
|
||||
# Pull out all of the interval's data and verify that it's
|
||||
# monotonic.
|
||||
maxrows = 100000
|
||||
maxrows = getattr(self, 'maxrows_override', 100000)
|
||||
path = self.stream_path[sid]
|
||||
layout = self.stream_layout[sid]
|
||||
dtype = nilmdb.client.numpyclient.layout_to_dtype(layout)
|
||||
|
@ -439,28 +536,75 @@ class Fsck(object):
|
|||
# Get raw data, convert to NumPy arary
|
||||
try:
|
||||
raw = tab.get_data(start, stop, binary=True)
|
||||
data = numpy.fromstring(raw, dtype)
|
||||
except Exception as e:
|
||||
raise FsckError("%s: failed to grab rows %d through %d: %s",
|
||||
data = numpy.frombuffer(raw, dtype)
|
||||
except Exception as e: # pragma: no cover
|
||||
# No coverage because it's hard to trigger this -- earlier
|
||||
# checks check the ranges, so this would probably be a real
|
||||
# disk error, malloc failure, etc.
|
||||
raise FsckError(
|
||||
"%s: failed to grab rows %d through %d: %s",
|
||||
path, start, stop, repr(e))
|
||||
|
||||
ts = data['timestamp']
|
||||
|
||||
# Verify that all timestamps are in range.
|
||||
match = (ts < stime) | (ts >= etime)
|
||||
if match.any():
|
||||
row = numpy.argmax(match)
|
||||
if ts[row] != 0:
|
||||
raise FsckError("%s: data timestamp %d at row %d "
|
||||
"outside interval range [%d,%d)",
|
||||
path, ts[row], row + start,
|
||||
stime, etime)
|
||||
|
||||
# Timestamp is zero and out of the expected range;
|
||||
# assume file ends with zeroed data and just truncate it.
|
||||
self.fix_table_by_truncating(
|
||||
path, tab, row + start,
|
||||
"data timestamp is out of range, and zero")
|
||||
|
||||
# Verify that timestamps are monotonic
|
||||
if (numpy.diff(data['timestamp']) <= 0).any():
|
||||
raise FsckError("%s: non-monotonic timestamp(s) in rows "
|
||||
"%d through %d", path, start, stop)
|
||||
first_ts = data['timestamp'][0]
|
||||
match = numpy.diff(ts) <= 0
|
||||
if match.any():
|
||||
row = numpy.argmax(match)
|
||||
if ts[row+1] != 0:
|
||||
raise FsckError(
|
||||
"%s: non-monotonic timestamp (%d -> %d) "
|
||||
"at row %d", path, ts[row], ts[row+1],
|
||||
row + start)
|
||||
|
||||
# Timestamp is zero and non-monotonic;
|
||||
# assume file ends with zeroed data and just truncate it.
|
||||
self.fix_table_by_truncating(
|
||||
path, tab, row + start + 1,
|
||||
"data timestamp is non-monotonic, and zero")
|
||||
|
||||
first_ts = ts[0]
|
||||
if last_ts is not None and first_ts <= last_ts:
|
||||
raise FsckError("%s: first interval timestamp %d is not "
|
||||
"greater than the previous last interval "
|
||||
"timestamp %d, at row %d",
|
||||
path, first_ts, last_ts, start)
|
||||
last_ts = data['timestamp'][-1]
|
||||
last_ts = ts[-1]
|
||||
|
||||
# These are probably fixable, by removing the offending
|
||||
# intervals. But I'm not going to bother implementing
|
||||
# that yet.
|
||||
# The previous errors are fixable, by removing the
|
||||
# offending intervals, or changing the data
|
||||
# timestamps. But these are probably unlikely errors,
|
||||
# so it's not worth implementing that yet.
|
||||
|
||||
# Done
|
||||
done += count
|
||||
update(done)
|
||||
return done
|
||||
|
||||
def fix_table_by_truncating(self, path, tab, row, reason):
|
||||
# Simple fix for bad data: truncate the table at the given row.
|
||||
# On retry, fix_bad_interval will correct the database and timestamps
|
||||
# to account for this truncation.
|
||||
msg = f"{path}: bad data in table, starting at row {row}: {reason}"
|
||||
if not self.fix:
|
||||
raise FixableFsckError(msg)
|
||||
err(f"\n{msg}\nWill try truncating table\n")
|
||||
(subdir, fname, offs, count) = tab._offset_from_row(row)
|
||||
tab._remove_or_truncate_file(subdir, fname, offs)
|
||||
raise RetryFsck
|
||||
|
|
|
@ -1,9 +1,8 @@
|
|||
#!/usr/bin/python
|
||||
#!/usr/bin/env python3
|
||||
|
||||
import nilmdb.fsck
|
||||
import argparse
|
||||
import os
|
||||
import sys
|
||||
|
||||
|
||||
def main():
|
||||
"""Main entry point for the 'nilmdb-fsck' command line script"""
|
||||
|
@ -23,5 +22,6 @@ def main():
|
|||
|
||||
nilmdb.fsck.Fsck(args.database, args.fix).check(skip_data=args.no_data)
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
main()
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
#!/usr/bin/python
|
||||
#!/usr/bin/env python3
|
||||
|
||||
import os
|
||||
import sys
|
||||
|
@ -78,9 +78,12 @@ def main():
|
|||
stats = yappi.get_func_stats()
|
||||
stats.sort("ttot")
|
||||
stats.print_all()
|
||||
try:
|
||||
from IPython import embed
|
||||
embed(header="Use the `yappi` or `stats` object to explore "
|
||||
"further, quit to exit")
|
||||
embed(header="Use the `yappi` or `stats` object to "
|
||||
"explore further, `quit` to exit")
|
||||
except ModuleNotFoundError:
|
||||
print("\nInstall ipython to explore further")
|
||||
else:
|
||||
server.start(blocking=True)
|
||||
except nilmdb.server.serverutil.CherryPyExit:
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
#!/usr/bin/python
|
||||
#!/usr/bin/env python3
|
||||
|
||||
import nilmdb.cmdline
|
||||
|
||||
|
|
|
@ -293,8 +293,8 @@ class Table():
|
|||
"layout": layout,
|
||||
"version": 3
|
||||
}
|
||||
with open(os.path.join(root, b"_format"), "wb") as f:
|
||||
pickle.dump(fmt, f, 2)
|
||||
nilmdb.utils.atomic.replace_file(
|
||||
os.path.join(root, b"_format"), pickle.dumps(fmt, 2))
|
||||
|
||||
# Normal methods
|
||||
def __init__(self, root, initial_nrows=0):
|
||||
|
|
|
@ -6,6 +6,7 @@ import sys
|
|||
import json
|
||||
import decorator
|
||||
import functools
|
||||
import threading
|
||||
|
||||
import cherrypy
|
||||
|
||||
|
@ -178,6 +179,19 @@ def cherrypy_patch_exit():
|
|||
os._exit = real_exit
|
||||
bus.exit = functools.partial(patched_exit, bus.exit)
|
||||
|
||||
# A behavior change in Python 3.8 means that some thread exceptions,
|
||||
# derived from SystemExit, now print tracebacks where they didn't
|
||||
# used to: https://bugs.python.org/issue1230540
|
||||
# Install a thread exception hook that ignores CherryPyExit;
|
||||
# to make this match the behavior where we didn't set
|
||||
# threading.excepthook, we also need to ignore SystemExit.
|
||||
def hook(args):
|
||||
if args.exc_type == CherryPyExit or args.exc_type == SystemExit:
|
||||
return
|
||||
sys.excepthook(args.exc_type, args.exc_value,
|
||||
args.exc_traceback) # pragma: no cover
|
||||
threading.excepthook = hook
|
||||
|
||||
|
||||
# Start/stop CherryPy standalone server
|
||||
def cherrypy_start(blocking=False, event=False):
|
||||
|
|
|
@ -26,7 +26,9 @@ class Timestamper():
|
|||
return b""
|
||||
if line[0:1] == b'#':
|
||||
continue
|
||||
break
|
||||
# For some reason, coverage on python 3.8 reports that
|
||||
# we never hit this break, even though we definitely do.
|
||||
break # pragma: no cover
|
||||
try:
|
||||
return next(self.ts_iter) + line
|
||||
except StopIteration:
|
||||
|
|
|
@ -1,16 +1,41 @@
|
|||
argcomplete>=1.10.0
|
||||
CherryPy>=18.1.2
|
||||
coverage>=4.5.4
|
||||
cython>=0.29.13
|
||||
decorator>=4.4.0
|
||||
fallocate>=1.6.4
|
||||
flake8>=3.7.8
|
||||
nose>=1.3.7
|
||||
numpy>=1.17.0
|
||||
progressbar>=2.5
|
||||
psutil>=5.6.3
|
||||
python-datetime-tz>=0.5.4
|
||||
python-dateutil>=2.8.0
|
||||
requests>=2.22.0
|
||||
tz>=0.2.2
|
||||
WebTest>=2.0.33
|
||||
argcomplete==1.12.0
|
||||
CherryPy==18.6.0
|
||||
coverage==5.2.1
|
||||
Cython==0.29.21
|
||||
decorator==4.4.2
|
||||
fallocate==1.6.4
|
||||
flake8==3.8.3
|
||||
nose==1.3.7
|
||||
numpy==1.19.1
|
||||
progressbar==2.5
|
||||
psutil==5.7.2
|
||||
python-datetime-tz==0.5.4
|
||||
python-dateutil==2.8.1
|
||||
requests==2.24.0
|
||||
tz==0.2.2
|
||||
yappi==1.2.5
|
||||
|
||||
## The following requirements were added by pip freeze:
|
||||
beautifulsoup4==4.9.1
|
||||
certifi==2020.6.20
|
||||
chardet==3.0.4
|
||||
cheroot==8.4.2
|
||||
idna==2.10
|
||||
jaraco.classes==3.1.0
|
||||
jaraco.collections==3.0.0
|
||||
jaraco.functools==3.0.1
|
||||
jaraco.text==3.2.0
|
||||
mccabe==0.6.1
|
||||
more-itertools==8.4.0
|
||||
portend==2.6
|
||||
pycodestyle==2.6.0
|
||||
pyflakes==2.2.0
|
||||
pytz==2020.1
|
||||
six==1.15.0
|
||||
soupsieve==2.0.1
|
||||
tempora==4.0.0
|
||||
urllib3==1.25.10
|
||||
waitress==1.4.4
|
||||
WebOb==1.8.6
|
||||
WebTest==2.0.35
|
||||
zc.lockfile==2.0
|
||||
|
|
|
@ -47,10 +47,13 @@ tag_prefix=nilmdb-
|
|||
parentdir_prefix=nilmdb-
|
||||
|
||||
[flake8]
|
||||
exclude=_version.py,fsck.py,nilmdb_fsck.py
|
||||
exclude=_version.py
|
||||
extend-ignore=E731
|
||||
per-file-ignores=__init__.py:F401,E402 serializer.py:E722 mustclose.py:E722
|
||||
per-file-ignores=__init__.py:F401,E402 \
|
||||
serializer.py:E722 \
|
||||
mustclose.py:E722 \
|
||||
fsck.py:E266
|
||||
|
||||
[pylint]
|
||||
ignore=_version.py,fsck.py,nilmdb_fsck.py
|
||||
ignore=_version.py
|
||||
disable=C0103,C0111,R0913,R0914
|
||||
|
|
2
setup.py
2
setup.py
|
@ -1,4 +1,4 @@
|
|||
#!/usr/bin/python
|
||||
#!/usr/bin/env python3
|
||||
|
||||
# To release a new version, tag it:
|
||||
# git tag -a nilmdb-1.1 -m "Version 1.1"
|
||||
|
|
BIN
tests/fsck-data/test1/data.sql
Normal file
BIN
tests/fsck-data/test1/data.sql
Normal file
Binary file not shown.
1
tests/fsck-data/test1/data/git-empty-dir-placeholder
Normal file
1
tests/fsck-data/test1/data/git-empty-dir-placeholder
Normal file
|
@ -0,0 +1 @@
|
|||
hi
|
1
tests/fsck-data/test1a/data/git-empty-dir-placeholder
Normal file
1
tests/fsck-data/test1a/data/git-empty-dir-placeholder
Normal file
|
@ -0,0 +1 @@
|
|||
hi
|
BIN
tests/fsck-data/test1b/data.sql
Normal file
BIN
tests/fsck-data/test1b/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test1c/data.sql
Normal file
BIN
tests/fsck-data/test1c/data.sql
Normal file
Binary file not shown.
1
tests/fsck-data/test1c/data/git-empty-dir-placeholder
Normal file
1
tests/fsck-data/test1c/data/git-empty-dir-placeholder
Normal file
|
@ -0,0 +1 @@
|
|||
hi
|
BIN
tests/fsck-data/test2/data.sql
Normal file
BIN
tests/fsck-data/test2/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2a/data.sql
Normal file
BIN
tests/fsck-data/test2a/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2a/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2a/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2a/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2a/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2b/data.sql
Normal file
BIN
tests/fsck-data/test2b/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2b/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2b/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2b/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2b/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2c/data.sql
Normal file
BIN
tests/fsck-data/test2c/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2c/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2c/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2c/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2c/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2d/data.sql
Normal file
BIN
tests/fsck-data/test2d/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2d/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2d/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2d/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2d/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2e/data.sql
Normal file
BIN
tests/fsck-data/test2e/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2e/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2e/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2e/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2e/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2f/data.sql
Normal file
BIN
tests/fsck-data/test2f/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2f/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2f/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2f/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2f/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2g/data.sql
Normal file
BIN
tests/fsck-data/test2g/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2g/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2g/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2g/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2g/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2h/data.sql
Normal file
BIN
tests/fsck-data/test2h/data.sql
Normal file
Binary file not shown.
1
tests/fsck-data/test2h/data/git-empty-dir-placeholder
Normal file
1
tests/fsck-data/test2h/data/git-empty-dir-placeholder
Normal file
|
@ -0,0 +1 @@
|
|||
hi
|
BIN
tests/fsck-data/test2i/data.sql
Normal file
BIN
tests/fsck-data/test2i/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2i/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2i/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2j/data.sql
Normal file
BIN
tests/fsck-data/test2j/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2j/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2j/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2j/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2j/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2k/data.sql
Normal file
BIN
tests/fsck-data/test2k/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2k/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2k/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2k/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2k/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2k1/data.sql
Normal file
BIN
tests/fsck-data/test2k1/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2k1/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2k1/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2k1/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2k1/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2l/data.sql
Normal file
BIN
tests/fsck-data/test2l/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2l/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2l/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2l/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2l/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2m/data.sql
Normal file
BIN
tests/fsck-data/test2m/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2m/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2m/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2m/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2m/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2n/data.sql
Normal file
BIN
tests/fsck-data/test2n/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2n/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2n/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2n/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2n/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2o/data.sql
Normal file
BIN
tests/fsck-data/test2o/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2o/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2o/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2o/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2o/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2p/data.sql
Normal file
BIN
tests/fsck-data/test2p/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2p/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2p/data/a/b/0000/0000
Normal file
Binary file not shown.
|
@ -0,0 +1 @@
|
|||
hi
|
BIN
tests/fsck-data/test2p/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2p/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2p1/data.sql
Normal file
BIN
tests/fsck-data/test2p1/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2p1/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2p1/data/a/b/0000/0000
Normal file
Binary file not shown.
1
tests/fsck-data/test2p1/data/a/b/0001/hello
Normal file
1
tests/fsck-data/test2p1/data/a/b/0001/hello
Normal file
|
@ -0,0 +1 @@
|
|||
world
|
BIN
tests/fsck-data/test2p1/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2p1/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2p2/data.sql
Normal file
BIN
tests/fsck-data/test2p2/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2p2/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2p2/data/a/b/0000/0000
Normal file
Binary file not shown.
1
tests/fsck-data/test2p2/data/a/b/0001/hello.removed
Normal file
1
tests/fsck-data/test2p2/data/a/b/0001/hello.removed
Normal file
|
@ -0,0 +1 @@
|
|||
world
|
BIN
tests/fsck-data/test2p2/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2p2/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2q/data.sql
Normal file
BIN
tests/fsck-data/test2q/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2q/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2q/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2q/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2q/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2q/data/a/c/0000/0000
Normal file
BIN
tests/fsck-data/test2q/data/a/c/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2q/data/a/c/_format
Normal file
BIN
tests/fsck-data/test2q/data/a/c/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r/data.sql
Normal file
BIN
tests/fsck-data/test2r/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2r/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2r/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r1/data.sql
Normal file
BIN
tests/fsck-data/test2r1/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r1/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2r1/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r1/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2r1/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r2/data.sql
Normal file
BIN
tests/fsck-data/test2r2/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r2/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2r2/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2r2/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2r2/data/a/b/_format
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2s/data.sql
Normal file
BIN
tests/fsck-data/test2s/data.sql
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2s/data/a/b/0000/0000
Normal file
BIN
tests/fsck-data/test2s/data/a/b/0000/0000
Normal file
Binary file not shown.
BIN
tests/fsck-data/test2s/data/a/b/_format
Normal file
BIN
tests/fsck-data/test2s/data/a/b/_format
Normal file
Binary file not shown.
Some files were not shown because too many files have changed in this diff Show More
Loading…
Reference in New Issue
Block a user