Compare commits
	
		
			122 Commits
		
	
	
		
			nilmdb-1.4
			...
			nilmdb-1.9
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| 8dd8741100 | |||
| 8e6341ae5d | |||
| 422b1e2df2 | |||
| 0f745b3047 | |||
| 71cd7ed9b7 | |||
| a79d6104d5 | |||
| 8e8ec59e30 | |||
| b89b945a0f | |||
| bd7bdb2eb8 | |||
| 840cd2fd13 | |||
| bbd59c8b50 | |||
| 405c110fd7 | |||
| 274adcd856 | |||
| a1850c9c2c | |||
| 6cd28b67b1 | |||
| d6d215d53d | |||
| e02143ddb2 | |||
| e275384d03 | |||
| a6a67ec15c | |||
| fc43107307 | |||
| 90633413bb | |||
| c7c3aff0fb | |||
| e2347c954e | |||
| 222a5c6c53 | |||
| 1ca2c143e5 | |||
| b5df575c79 | |||
| 2768a5ad15 | |||
| a105543c38 | |||
| 309f38d0ed | |||
| 9a27b6ef6a | |||
| 99532cf9e0 | |||
| dfdd0e5c74 | |||
| 9a2699adfc | |||
| 9bbb95b18b | |||
| 6bbed322c5 | |||
| 2317894355 | |||
| 539c92226c | |||
| 77c766d85d | |||
| 49d04db1d6 | |||
| ea838d05ae | |||
| f2a48bdb2a | |||
| 6d14e0b8aa | |||
| b31b9327b9 | |||
| b98ff1331a | |||
| 00e6ba1124 | |||
| 01029230c9 | |||
| ecc4e5ef9d | |||
| 23f31c472b | |||
| a1e2746360 | |||
| 1c40d59a52 | |||
| bfb09a189f | |||
| 416a499866 | |||
| 637d193807 | |||
| b7fa5745ce | |||
| 0104c8edd9 | |||
| cf3b8e787d | |||
| 83d022016c | |||
| 43b740ecaa | |||
| 4ce059b920 | |||
| 99a4228285 | |||
| 230ec72609 | |||
| d36ece3767 | |||
| 231963538e | |||
| b4d6aad6de | |||
| e95142eabf | |||
| d21c3470bc | |||
| 7576883f49 | |||
| cc211542f8 | |||
| 8292dcf70b | |||
| b362fd37f6 | |||
| 41ec13ee17 | |||
| efa9aa9097 | |||
| d9afb48f45 | |||
| d1140e0f16 | |||
| 6091e44561 | |||
| e233ba790f | |||
| f0304b4c00 | |||
| 60594ca58e | |||
| c7f2df4abc | |||
| 5b7409f802 | |||
| 06038062a2 | |||
| ae9fe89759 | |||
| 04def60021 | |||
| 9ce0f69dff | |||
| 90c3be91c4 | |||
| ebccfb3531 | |||
| e006f1d02e | |||
| 5292319802 | |||
| 173121ca87 | |||
| 26bab031bd | |||
| b5fefffa09 | |||
| dccb3e370a | |||
| 95ca55aa7e | |||
| e01813f29d | |||
| 7f41e117a2 | |||
| dd5fc806e5 | |||
| f8ca8d31e6 | |||
| ed89d803f0 | |||
| 3d24092cd2 | |||
| 304bb43d85 | |||
| 59a79a30a5 | |||
| c0d450d39e | |||
| 6f14d609b2 | |||
| 77ef87456f | |||
| 32d6af935c | |||
| 6af3a6fc41 | |||
| f8a06fb3b7 | |||
| e790bb9e8a | |||
| 89be6f5931 | |||
| 4cdef3285d | |||
| bcd82c4d59 | |||
| caf63ab01f | |||
| 2d72891162 | |||
| cda2ac3e77 | |||
| 57d3d60f6a | |||
| d6b5befe76 | |||
| 7429c1788d | |||
| 0ef71c193b | |||
| 4a50dd015e | |||
| 22274550ab | |||
| 4f06d6ae68 | |||
| c54d8041c3 | 
| @@ -7,4 +7,4 @@ | |||||||
| exclude_lines = | exclude_lines = | ||||||
| 	pragma: no cover | 	pragma: no cover | ||||||
| 	if 0: | 	if 0: | ||||||
| omit = nilmdb/utils/datetime_tz*,nilmdb/scripts,nilmdb/_version.py | omit = nilmdb/utils/datetime_tz*,nilmdb/scripts,nilmdb/_version.py,nilmdb/fsck | ||||||
|   | |||||||
							
								
								
									
										6
									
								
								Makefile
									
									
									
									
									
								
							
							
						
						
									
										6
									
								
								Makefile
									
									
									
									
									
								
							| @@ -1,5 +1,5 @@ | |||||||
| # By default, run the tests. | # By default, run the tests. | ||||||
| all: test | all: fscktest | ||||||
|  |  | ||||||
| version: | version: | ||||||
| 	python setup.py version | 	python setup.py version | ||||||
| @@ -23,6 +23,10 @@ docs: | |||||||
| lint: | lint: | ||||||
| 	pylint --rcfile=.pylintrc nilmdb | 	pylint --rcfile=.pylintrc nilmdb | ||||||
|  |  | ||||||
|  | fscktest: | ||||||
|  | 	python -c "import nilmdb.fsck; nilmdb.fsck.Fsck('/home/jim/wsgi/db').check()" | ||||||
|  | #	python -c "import nilmdb.fsck; nilmdb.fsck.Fsck('/home/jim/mnt/bucket/mnt/sharon/data/db', True).check()" | ||||||
|  |  | ||||||
| test: | test: | ||||||
| ifeq ($(INSIDE_EMACS), t) | ifeq ($(INSIDE_EMACS), t) | ||||||
| # Use the slightly more flexible script | # Use the slightly more flexible script | ||||||
|   | |||||||
| @@ -8,7 +8,11 @@ Prerequisites: | |||||||
|  |  | ||||||
|   # Base NilmDB dependencies |   # Base NilmDB dependencies | ||||||
|   sudo apt-get install python-cherrypy3 python-decorator python-simplejson |   sudo apt-get install python-cherrypy3 python-decorator python-simplejson | ||||||
|   sudo apt-get install python-requests python-dateutil python-tz python-psutil |   sudo apt-get install python-requests python-dateutil python-tz | ||||||
|  |   sudo apt-get install python-progressbar python-psutil | ||||||
|  |  | ||||||
|  |   # Other dependencies (required by some modules) | ||||||
|  |   sudo apt-get install python-numpy | ||||||
|  |  | ||||||
|   # Tools for running tests |   # Tools for running tests | ||||||
|   sudo apt-get install python-nose python-coverage |   sudo apt-get install python-nose python-coverage | ||||||
| @@ -23,4 +27,7 @@ Install: | |||||||
| Usage: | Usage: | ||||||
|  |  | ||||||
|   nilmdb-server --help |   nilmdb-server --help | ||||||
|  |   nilmdb-fsck --help | ||||||
|   nilmtool --help |   nilmtool --help | ||||||
|  |  | ||||||
|  | See docs/wsgi.md for info on setting up a WSGI application in Apache. | ||||||
|   | |||||||
| @@ -186,6 +186,19 @@ IntervalSet speed | |||||||
|     - rbtree and interval converted to cython: |     - rbtree and interval converted to cython: | ||||||
|       8.4 μS, total 12 s, 134 MB RAM |       8.4 μS, total 12 s, 134 MB RAM | ||||||
|  |  | ||||||
|  | - Would like to move Interval itself back to Python so other | ||||||
|  |   non-cythonized code like client code can use it more easily. | ||||||
|  |   Testing speed with just `test_interval` being tested, with | ||||||
|  |   `range(5,22)`, using `/usr/bin/time -v python tests/runtests.py`, | ||||||
|  |   times recorded for 2097152: | ||||||
|  |     - 52ae397 (Interval in cython): | ||||||
|  | 	  12.6133 μs each, ratio 0.866533, total 47 sec, 399 MB RAM | ||||||
|  | 	- 9759dcf (Interval in python): | ||||||
|  | 	  21.2937 μs each, ratio 1.462870, total 83 sec, 1107 MB RAM | ||||||
|  |   That's a huge difference!  Instead, will keep Interval and DBInterval | ||||||
|  |   cythonized inside nilmdb, and just have an additional copy in | ||||||
|  |   nilmdb.utils for clients to use. | ||||||
|  |  | ||||||
| Layouts | Layouts | ||||||
| ------- | ------- | ||||||
| Current/old design has specific layouts: RawData, PrepData, RawNotchedData. | Current/old design has specific layouts: RawData, PrepData, RawNotchedData. | ||||||
| @@ -376,3 +389,52 @@ Possible solutions: | |||||||
|     are always printed as int64 values, and a new format |     are always printed as int64 values, and a new format | ||||||
|     "@1234567890123456" is added to the parser for specifying them |     "@1234567890123456" is added to the parser for specifying them | ||||||
|     exactly. |     exactly. | ||||||
|  |  | ||||||
|  | Binary interface | ||||||
|  | ---------------- | ||||||
|  |  | ||||||
|  | The ASCII interface is too slow for high-bandwidth processing, like | ||||||
|  | sinefits, prep, etc.  A binary interface was added so that you can | ||||||
|  | extract the raw binary out of the bulkdata storage.  This binary is | ||||||
|  | a little-endian format, e.g. in C a uint16_6 stream would be: | ||||||
|  |  | ||||||
|  |     #include <endian.h> | ||||||
|  |     #include <stdint.h> | ||||||
|  |     struct { | ||||||
|  |         int64_t timestamp_le; | ||||||
|  |         uint16_t data_le[6]; | ||||||
|  |     } __attribute__((packed)); | ||||||
|  |  | ||||||
|  | Remember to byteswap (with e.g. `letoh` in C)! | ||||||
|  |  | ||||||
|  | This interface is used by the new `nilmdb.client.numpyclient.NumpyClient` | ||||||
|  | class, which is a subclass of the normal `nilmcb.client.client.Client` | ||||||
|  | and has all of the same functions.  It adds three new functions: | ||||||
|  |  | ||||||
|  | - `stream_extract_numpy` to extract data as a Numpy array | ||||||
|  |  | ||||||
|  | - `stream_insert_numpy` to insert data as a Numpy array | ||||||
|  |  | ||||||
|  | - `stream_insert_numpy_context` is the context manager for | ||||||
|  |   incrementally inserting data | ||||||
|  |  | ||||||
|  | It is significantly faster!  It is about 20 times faster to decimate a | ||||||
|  | stream with `nilm-decimate` when the filter code is using the new | ||||||
|  | binary/numpy interface. | ||||||
|  |  | ||||||
|  |  | ||||||
|  | WSGI interface & chunked requests | ||||||
|  | --------------------------------- | ||||||
|  |  | ||||||
|  | mod_wsgi requires "WSGIChunkedRequest On" to handle | ||||||
|  | "Transfer-encoding: Chunked" requests.  However, `/stream/insert` | ||||||
|  | doesn't handle this correctly right now, because: | ||||||
|  |  | ||||||
|  | - The `cherrpy.request.body.read()` call needs to be fixed for chunked requests | ||||||
|  |  | ||||||
|  | - We don't want to just buffer endlessly in the server, and it will | ||||||
|  |   require some thought on how to handle data in chunks (what to do about | ||||||
|  |   interval endpoints). | ||||||
|  |  | ||||||
|  | It is probably better to just keep the endpoint management on the client | ||||||
|  | side, so leave "WSGIChunkedRequest off" for now. | ||||||
|   | |||||||
							
								
								
									
										32
									
								
								docs/wsgi.md
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										32
									
								
								docs/wsgi.md
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,32 @@ | |||||||
|  | WSGI Application in Apache | ||||||
|  | -------------------------- | ||||||
|  |  | ||||||
|  | Install `apache2` and `libapache2-mod-wsgi` | ||||||
|  |  | ||||||
|  | We'll set up the database server at URL `http://myhost.com/nilmdb`. | ||||||
|  | The database will be stored in `/home/nilm/db`, and the process will | ||||||
|  | run as user `nilm`, group `nilm`. | ||||||
|  |  | ||||||
|  | First, create a WSGI script `/home/nilm/nilmdb.wsgi` containing: | ||||||
|  |  | ||||||
|  |     import nilmdb.server | ||||||
|  |     application = nilmdb.server.wsgi_application("/home/nilm/db", "/nilmdb") | ||||||
|  |  | ||||||
|  | The first parameter is the local filesystem path, and the second | ||||||
|  | parameter is the path part of the URL. | ||||||
|  |  | ||||||
|  | Then, set up Apache with a configuration like: | ||||||
|  |  | ||||||
|  |     <VirtualHost> | ||||||
|  |         WSGIScriptAlias /nilmdb /home/nilm/nilmdb.wsgi | ||||||
|  |         WSGIDaemonProcess nilmdb-procgroup threads=32 user=nilm group=nilm | ||||||
|  |         <Location /nilmdb> | ||||||
|  |             WSGIProcessGroup nilmdb-procgroup | ||||||
|  |             WSGIApplicationGroup nilmdb-appgroup | ||||||
|  |  | ||||||
|  |             # Access control example: | ||||||
|  |             Order deny,allow | ||||||
|  |             Deny from all | ||||||
|  |             Allow from 1.2.3.4 | ||||||
|  |         </Location> | ||||||
|  |     </VirtualHost> | ||||||
							
								
								
									
										50
									
								
								extras/fix-oversize-files.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										50
									
								
								extras/fix-oversize-files.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,50 @@ | |||||||
|  | #!/usr/bin/python | ||||||
|  |  | ||||||
|  | import os | ||||||
|  | import sys | ||||||
|  | import cPickle as pickle | ||||||
|  | import argparse | ||||||
|  | import fcntl | ||||||
|  | import re | ||||||
|  | from nilmdb.client.numpyclient import layout_to_dtype | ||||||
|  |  | ||||||
|  | parser = argparse.ArgumentParser( | ||||||
|  |     description = """ | ||||||
|  | Fix database corruption where binary writes caused too much data to be | ||||||
|  | written to the file.  Truncates files to the correct length.  This was | ||||||
|  | fixed by b98ff1331a515ad47fd3203615e835b529b039f9. | ||||||
|  | """) | ||||||
|  | parser.add_argument("path", action="store", help='Database root path') | ||||||
|  | parser.add_argument("-y", "--yes", action="store_true", help='Fix them') | ||||||
|  | args = parser.parse_args() | ||||||
|  |  | ||||||
|  | lock = os.path.join(args.path, "data.lock") | ||||||
|  | with open(lock, "w") as f: | ||||||
|  |     fcntl.flock(f.fileno(), fcntl.LOCK_EX | fcntl.LOCK_NB) | ||||||
|  |  | ||||||
|  |     fix = {} | ||||||
|  |  | ||||||
|  |     for (path, dirs, files) in os.walk(args.path): | ||||||
|  |         if "_format" in files: | ||||||
|  |             with open(os.path.join(path, "_format")) as format: | ||||||
|  |                 fmt = pickle.load(format) | ||||||
|  |                 rowsize = layout_to_dtype(fmt["layout"]).itemsize | ||||||
|  |                 maxsize = rowsize * fmt["rows_per_file"] | ||||||
|  |                 fix[path] = maxsize | ||||||
|  |                 if maxsize < 128000000: # sanity check | ||||||
|  |                     raise Exception("bad maxsize " + str(maxsize)) | ||||||
|  |  | ||||||
|  |     for fixpath in fix: | ||||||
|  |         for (path, dirs, files) in os.walk(fixpath): | ||||||
|  |             for fn in files: | ||||||
|  |                 if not re.match("^[0-9a-f]{4,}$", fn): | ||||||
|  |                     continue | ||||||
|  |                 fn = os.path.join(path, fn) | ||||||
|  |                 size = os.path.getsize(fn) | ||||||
|  |                 maxsize = fix[fixpath] | ||||||
|  |                 if size > maxsize: | ||||||
|  |                     diff = size - maxsize | ||||||
|  |                     print diff, "too big:", fn | ||||||
|  |                     if args.yes: | ||||||
|  |                         with open(fn, "a+") as dbfile: | ||||||
|  |                             dbfile.truncate(maxsize) | ||||||
| @@ -17,4 +17,4 @@ _nilmtool_argcomplete() { | |||||||
|         unset COMPREPLY |         unset COMPREPLY | ||||||
|     fi |     fi | ||||||
| } | } | ||||||
| complete -o nospace -o default -F _nilmtool_argcomplete nilmtool | complete -o nospace -F _nilmtool_argcomplete nilmtool | ||||||
|   | |||||||
| @@ -58,6 +58,11 @@ class Client(object): | |||||||
|         return self.http.get("dbinfo") |         return self.http.get("dbinfo") | ||||||
|  |  | ||||||
|     def stream_list(self, path = None, layout = None, extended = False): |     def stream_list(self, path = None, layout = None, extended = False): | ||||||
|  |         """Return a sorted list of [path, layout] lists.  If 'path' or | ||||||
|  |         'layout' are specified, only return streams that match those | ||||||
|  |         exact values.  If 'extended' is True, the returned lists have | ||||||
|  |         extended info, e.g.: [path, layout, extent_min, extent_max, | ||||||
|  |         total_rows, total_seconds.""" | ||||||
|         params = {} |         params = {} | ||||||
|         if path is not None: |         if path is not None: | ||||||
|             params["path"] = path |             params["path"] = path | ||||||
| @@ -65,9 +70,11 @@ class Client(object): | |||||||
|             params["layout"] = layout |             params["layout"] = layout | ||||||
|         if extended: |         if extended: | ||||||
|             params["extended"] = 1 |             params["extended"] = 1 | ||||||
|         return self.http.get("stream/list", params) |         streams = self.http.get("stream/list", params) | ||||||
|  |         return nilmdb.utils.sort.sort_human(streams, key = lambda s: s[0]) | ||||||
|  |  | ||||||
|     def stream_get_metadata(self, path, keys = None): |     def stream_get_metadata(self, path, keys = None): | ||||||
|  |         """Get stream metadata""" | ||||||
|         params = { "path": path } |         params = { "path": path } | ||||||
|         if keys is not None: |         if keys is not None: | ||||||
|             params["key"] = keys |             params["key"] = keys | ||||||
| @@ -97,7 +104,7 @@ class Client(object): | |||||||
|         return self.http.post("stream/create", params) |         return self.http.post("stream/create", params) | ||||||
|  |  | ||||||
|     def stream_destroy(self, path): |     def stream_destroy(self, path): | ||||||
|         """Delete stream and its contents""" |         """Delete stream.  Fails if any data is still present.""" | ||||||
|         params = { "path": path } |         params = { "path": path } | ||||||
|         return self.http.post("stream/destroy", params) |         return self.http.post("stream/destroy", params) | ||||||
|  |  | ||||||
| @@ -116,15 +123,19 @@ class Client(object): | |||||||
|             params["start"] = timestamp_to_string(start) |             params["start"] = timestamp_to_string(start) | ||||||
|         if end is not None: |         if end is not None: | ||||||
|             params["end"] = timestamp_to_string(end) |             params["end"] = timestamp_to_string(end) | ||||||
|         return self.http.post("stream/remove", params) |         total = 0 | ||||||
|  |         for count in self.http.post_gen("stream/remove", params): | ||||||
|  |             total += int(count) | ||||||
|  |         return total | ||||||
|  |  | ||||||
|     @contextlib.contextmanager |     @contextlib.contextmanager | ||||||
|     def stream_insert_context(self, path, start = None, end = None): |     def stream_insert_context(self, path, start = None, end = None): | ||||||
|         """Return a context manager that allows data to be efficiently |         """Return a context manager that allows data to be efficiently | ||||||
|         inserted into a stream in a piecewise manner.  Data is be provided |         inserted into a stream in a piecewise manner.  Data is | ||||||
|         as single lines, and is aggregated and sent to the server in larger |         provided as ASCII lines, and is aggregated and sent to the | ||||||
|         chunks as necessary.  Data lines must match the database layout for |         server in larger or smaller chunks as necessary.  Data lines | ||||||
|         the given path, and end with a newline. |         must match the database layout for the given path, and end | ||||||
|  |         with a newline. | ||||||
|  |  | ||||||
|         Example: |         Example: | ||||||
|           with client.stream_insert_context('/path', start, end) as ctx: |           with client.stream_insert_context('/path', start, end) as ctx: | ||||||
| @@ -136,15 +147,17 @@ class Client(object): | |||||||
|         This may make multiple requests to the server, if the data is |         This may make multiple requests to the server, if the data is | ||||||
|         large enough or enough time has passed between insertions. |         large enough or enough time has passed between insertions. | ||||||
|         """ |         """ | ||||||
|         ctx = StreamInserter(self.http, path, start, end) |         ctx = StreamInserter(self, path, start, end) | ||||||
|         yield ctx |         yield ctx | ||||||
|         ctx.finalize() |         ctx.finalize() | ||||||
|  |         ctx.destroy() | ||||||
|  |  | ||||||
|     def stream_insert(self, path, data, start = None, end = None): |     def stream_insert(self, path, data, start = None, end = None): | ||||||
|         """Insert rows of data into a stream.  data should be a string |         """Insert rows of data into a stream.  data should be a string | ||||||
|         or iterable that provides ASCII data that matches the database |         or iterable that provides ASCII data that matches the database | ||||||
|         layout for path.  See stream_insert_context for details on the |         layout for path.  Data is passed through stream_insert_context, | ||||||
|         'start' and 'end' parameters.""" |         so it will be broken into reasonably-sized chunks and | ||||||
|  |         start/end will be deduced if missing.""" | ||||||
|         with self.stream_insert_context(path, start, end) as ctx: |         with self.stream_insert_context(path, start, end) as ctx: | ||||||
|             if isinstance(data, basestring): |             if isinstance(data, basestring): | ||||||
|                 ctx.insert(data) |                 ctx.insert(data) | ||||||
| @@ -153,11 +166,28 @@ class Client(object): | |||||||
|                     ctx.insert(chunk) |                     ctx.insert(chunk) | ||||||
|         return ctx.last_response |         return ctx.last_response | ||||||
|  |  | ||||||
|  |     def stream_insert_block(self, path, data, start, end, binary = False): | ||||||
|  |         """Insert a single fixed block of data into the stream.  It is | ||||||
|  |         sent directly to the server in one block with no further | ||||||
|  |         processing. | ||||||
|  |  | ||||||
|  |         If 'binary' is True, provide raw binary data in little-endian | ||||||
|  |         format matching the path layout, including an int64 timestamp. | ||||||
|  |         Otherwise, provide ASCII data matching the layout.""" | ||||||
|  |         params = { | ||||||
|  |             "path": path, | ||||||
|  |             "start": timestamp_to_string(start), | ||||||
|  |             "end": timestamp_to_string(end), | ||||||
|  |         } | ||||||
|  |         if binary: | ||||||
|  |             params["binary"] = 1 | ||||||
|  |         return self.http.put("stream/insert", data, params, binary = binary) | ||||||
|  |  | ||||||
|     def stream_intervals(self, path, start = None, end = None, diffpath = None): |     def stream_intervals(self, path, start = None, end = None, diffpath = None): | ||||||
|         """ |         """ | ||||||
|         Return a generator that yields each stream interval. |         Return a generator that yields each stream interval. | ||||||
|  |  | ||||||
|         If diffpath is not None, yields only interval ranges that are |         If 'diffpath' is not None, yields only interval ranges that are | ||||||
|         present in 'path' but not in 'diffpath'. |         present in 'path' but not in 'diffpath'. | ||||||
|         """ |         """ | ||||||
|         params = { |         params = { | ||||||
| @@ -171,14 +201,23 @@ class Client(object): | |||||||
|             params["end"] = timestamp_to_string(end) |             params["end"] = timestamp_to_string(end) | ||||||
|         return self.http.get_gen("stream/intervals", params) |         return self.http.get_gen("stream/intervals", params) | ||||||
|  |  | ||||||
|     def stream_extract(self, path, start = None, end = None, count = False): |     def stream_extract(self, path, start = None, end = None, | ||||||
|  |                        count = False, markup = False, binary = False): | ||||||
|         """ |         """ | ||||||
|         Extract data from a stream.  Returns a generator that yields |         Extract data from a stream.  Returns a generator that yields | ||||||
|         lines of ASCII-formatted data that matches the database |         lines of ASCII-formatted data that matches the database | ||||||
|         layout for the given path. |         layout for the given path. | ||||||
|  |  | ||||||
|         Specify count = True to return a count of matching data points |         If 'count' is True, return a count of matching data points | ||||||
|         rather than the actual data.  The output format is unchanged. |         rather than the actual data.  The output format is unchanged. | ||||||
|  |  | ||||||
|  |         If 'markup' is True, include comments in the returned data | ||||||
|  |         that indicate interval starts and ends. | ||||||
|  |  | ||||||
|  |         If 'binary' is True, return chunks of raw binary data, rather | ||||||
|  |         than lines of ASCII-formatted data.  Raw binary data is | ||||||
|  |         little-endian and matches the database types (including an | ||||||
|  |         int64 timestamp). | ||||||
|         """ |         """ | ||||||
|         params = { |         params = { | ||||||
|             "path": path, |             "path": path, | ||||||
| @@ -189,7 +228,11 @@ class Client(object): | |||||||
|             params["end"] = timestamp_to_string(end) |             params["end"] = timestamp_to_string(end) | ||||||
|         if count: |         if count: | ||||||
|             params["count"] = 1 |             params["count"] = 1 | ||||||
|         return self.http.get_gen("stream/extract", params) |         if markup: | ||||||
|  |             params["markup"] = 1 | ||||||
|  |         if binary: | ||||||
|  |             params["binary"] = 1 | ||||||
|  |         return self.http.get_gen("stream/extract", params, binary = binary) | ||||||
|  |  | ||||||
|     def stream_count(self, path, start = None, end = None): |     def stream_count(self, path, start = None, end = None): | ||||||
|         """ |         """ | ||||||
| @@ -238,13 +281,13 @@ class StreamInserter(object): | |||||||
|     _max_data = 2 * 1024 * 1024 |     _max_data = 2 * 1024 * 1024 | ||||||
|     _max_data_after_send = 64 * 1024 |     _max_data_after_send = 64 * 1024 | ||||||
|  |  | ||||||
|     def __init__(self, http, path, start = None, end = None): |     def __init__(self, client, path, start, end): | ||||||
|         """'http' is the httpclient object.  'path' is the database |         """'client' is the client object.  'path' is the database | ||||||
|         path to insert to.  'start' and 'end' are used for the first |         path to insert to.  'start' and 'end' are used for the first | ||||||
|         contiguous interval.""" |         contiguous interval and may be None.""" | ||||||
|         self.last_response = None |         self.last_response = None | ||||||
|  |  | ||||||
|         self._http = http |         self._client = client | ||||||
|         self._path = path |         self._path = path | ||||||
|  |  | ||||||
|         # Start and end for the overall contiguous interval we're |         # Start and end for the overall contiguous interval we're | ||||||
| @@ -257,6 +300,15 @@ class StreamInserter(object): | |||||||
|         self._block_data = [] |         self._block_data = [] | ||||||
|         self._block_len = 0 |         self._block_len = 0 | ||||||
|  |  | ||||||
|  |         self.destroyed = False | ||||||
|  |  | ||||||
|  |     def destroy(self): | ||||||
|  |         """Ensure this object can't be used again without raising | ||||||
|  |         an error""" | ||||||
|  |         def error(*args, **kwargs): | ||||||
|  |             raise Exception("don't reuse this context object") | ||||||
|  |         self._send_block = self.insert = self.finalize = self.send = error | ||||||
|  |  | ||||||
|     def insert(self, data): |     def insert(self, data): | ||||||
|         """Insert a chunk of ASCII formatted data in string form.  The |         """Insert a chunk of ASCII formatted data in string form.  The | ||||||
|         overall data must consist of lines terminated by '\\n'.""" |         overall data must consist of lines terminated by '\\n'.""" | ||||||
| @@ -307,6 +359,11 @@ class StreamInserter(object): | |||||||
|         part of a new interval and there may be a gap left in-between.""" |         part of a new interval and there may be a gap left in-between.""" | ||||||
|         self._send_block(final = True) |         self._send_block(final = True) | ||||||
|  |  | ||||||
|  |     def send(self): | ||||||
|  |         """Send any data that we might have buffered up.  Does not affect | ||||||
|  |         any other treatment of timestamps or endpoints.""" | ||||||
|  |         self._send_block(final = False) | ||||||
|  |  | ||||||
|     def _get_first_noncomment(self, block): |     def _get_first_noncomment(self, block): | ||||||
|         """Return the (start, end) indices of the first full line in |         """Return the (start, end) indices of the first full line in | ||||||
|         block that isn't a comment, or raise IndexError if |         block that isn't a comment, or raise IndexError if | ||||||
| @@ -398,7 +455,7 @@ class StreamInserter(object): | |||||||
|             self._interval_start = end_ts |             self._interval_start = end_ts | ||||||
|  |  | ||||||
|         # Double check endpoints |         # Double check endpoints | ||||||
|         if start_ts is None or end_ts is None: |         if (start_ts is None or end_ts is None) or (start_ts == end_ts): | ||||||
|             # If the block has no non-comment lines, it's OK |             # If the block has no non-comment lines, it's OK | ||||||
|             try: |             try: | ||||||
|                 self._get_first_noncomment(block) |                 self._get_first_noncomment(block) | ||||||
| @@ -407,9 +464,7 @@ class StreamInserter(object): | |||||||
|             raise ClientError("have data to send, but no start/end times") |             raise ClientError("have data to send, but no start/end times") | ||||||
|  |  | ||||||
|         # Send it |         # Send it | ||||||
|         params = { "path": self._path, |         self.last_response = self._client.stream_insert_block( | ||||||
|                    "start": timestamp_to_string(start_ts), |             self._path, block, start_ts, end_ts, binary = False) | ||||||
|                    "end": timestamp_to_string(end_ts) } |  | ||||||
|         self.last_response = self._http.put("stream/insert", block, params) |  | ||||||
|  |  | ||||||
|         return |         return | ||||||
|   | |||||||
| @@ -16,7 +16,7 @@ class HTTPClient(object): | |||||||
|         reparsed = urlparse.urlparse(baseurl).geturl() |         reparsed = urlparse.urlparse(baseurl).geturl() | ||||||
|         if '://' not in reparsed: |         if '://' not in reparsed: | ||||||
|             reparsed = urlparse.urlparse("http://" + baseurl).geturl() |             reparsed = urlparse.urlparse("http://" + baseurl).geturl() | ||||||
|         self.baseurl = reparsed |         self.baseurl = reparsed.rstrip('/') + '/' | ||||||
|  |  | ||||||
|         # Build Requests session object, enable SSL verification |         # Build Requests session object, enable SSL verification | ||||||
|         self.session = requests.Session() |         self.session = requests.Session() | ||||||
| @@ -105,12 +105,17 @@ class HTTPClient(object): | |||||||
|         else: |         else: | ||||||
|             return self._req("POST", url, None, params) |             return self._req("POST", url, None, params) | ||||||
|  |  | ||||||
|     def put(self, url, data, params = None): |     def put(self, url, data, params = None, binary = False): | ||||||
|         """Simple PUT (parameters in URL, data in body)""" |         """Simple PUT (parameters in URL, data in body)""" | ||||||
|         return self._req("PUT", url, params, data) |         if binary: | ||||||
|  |             h = { 'Content-type': 'application/octet-stream' } | ||||||
|  |         else: | ||||||
|  |             h = { 'Content-type': 'text/plain; charset=utf-8' } | ||||||
|  |         return self._req("PUT", url, query = params, body = data, headers = h) | ||||||
|  |  | ||||||
|     # Generator versions that return data one line at a time. |     # Generator versions that return data one line at a time. | ||||||
|     def _req_gen(self, method, url, query = None, body = None, headers = None): |     def _req_gen(self, method, url, query = None, body = None, | ||||||
|  |                  headers = None, binary = False): | ||||||
|         """ |         """ | ||||||
|         Make a request and return a generator that gives back strings |         Make a request and return a generator that gives back strings | ||||||
|         or JSON decoded lines of the body data, or raise an error if |         or JSON decoded lines of the body data, or raise an error if | ||||||
| @@ -118,16 +123,50 @@ class HTTPClient(object): | |||||||
|         """ |         """ | ||||||
|         (response, isjson) = self._do_req(method, url, query, body, |         (response, isjson) = self._do_req(method, url, query, body, | ||||||
|                                           stream = True, headers = headers) |                                           stream = True, headers = headers) | ||||||
|         if isjson: |  | ||||||
|             for line in response.iter_lines(): |         # Like the iter_lines function in Requests, but only splits on | ||||||
|  |         # the specified line ending. | ||||||
|  |         def lines(source, ending): | ||||||
|  |             pending = None | ||||||
|  |             for chunk in source: | ||||||
|  |                 if pending is not None: | ||||||
|  |                     chunk = pending + chunk | ||||||
|  |                 tmp = chunk.split(ending) | ||||||
|  |                 lines = tmp[:-1] | ||||||
|  |                 if chunk.endswith(ending): | ||||||
|  |                     pending = None | ||||||
|  |                 else: | ||||||
|  |                     pending = tmp[-1] | ||||||
|  |                 for line in lines: | ||||||
|  |                     yield line | ||||||
|  |             if pending is not None: # pragma: no cover (missing newline) | ||||||
|  |                 yield pending | ||||||
|  |  | ||||||
|  |         # Yield the chunks or lines as requested | ||||||
|  |         if binary: | ||||||
|  |             for chunk in response.iter_content(chunk_size = 65536): | ||||||
|  |                 yield chunk | ||||||
|  |         elif isjson: | ||||||
|  |             for line in lines(response.iter_content(chunk_size = 1), | ||||||
|  |                               ending = '\r\n'): | ||||||
|                 yield json.loads(line) |                 yield json.loads(line) | ||||||
|         else: |         else: | ||||||
|             for line in response.iter_lines(): |             for line in lines(response.iter_content(chunk_size = 65536), | ||||||
|  |                               ending = '\n'): | ||||||
|                 yield line |                 yield line | ||||||
|  |  | ||||||
|     def get_gen(self, url, params = None): |     def get_gen(self, url, params = None, binary = False): | ||||||
|         """Simple GET (parameters in URL) returning a generator""" |         """Simple GET (parameters in URL) returning a generator""" | ||||||
|         return self._req_gen("GET", url, params) |         return self._req_gen("GET", url, params, binary = binary) | ||||||
|  |  | ||||||
|  |     def post_gen(self, url, params = None): | ||||||
|  |         """Simple POST (parameters in body) returning a generator""" | ||||||
|  |         if self.post_json: | ||||||
|  |             return self._req_gen("POST", url, None, | ||||||
|  |                                  json.dumps(params), | ||||||
|  |                                  { 'Content-type': 'application/json' }) | ||||||
|  |         else: | ||||||
|  |             return self._req_gen("POST", url, None, params) | ||||||
|  |  | ||||||
|     # Not much use for a POST or PUT generator, since they don't |     # Not much use for a POST or PUT generator, since they don't | ||||||
|     # return much data. |     # return much data. | ||||||
|   | |||||||
							
								
								
									
										258
									
								
								nilmdb/client/numpyclient.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										258
									
								
								nilmdb/client/numpyclient.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,258 @@ | |||||||
|  | # -*- coding: utf-8 -*- | ||||||
|  |  | ||||||
|  | """Provide a NumpyClient class that is based on normal Client, but has | ||||||
|  | additional methods for extracting and inserting data via Numpy arrays.""" | ||||||
|  |  | ||||||
|  | import nilmdb.utils | ||||||
|  | import nilmdb.client.client | ||||||
|  | import nilmdb.client.httpclient | ||||||
|  | from nilmdb.client.errors import ClientError | ||||||
|  |  | ||||||
|  | import contextlib | ||||||
|  | from nilmdb.utils.time import timestamp_to_string, string_to_timestamp | ||||||
|  |  | ||||||
|  | import numpy | ||||||
|  | import cStringIO | ||||||
|  |  | ||||||
|  | def layout_to_dtype(layout): | ||||||
|  |     ltype = layout.split('_')[0] | ||||||
|  |     lcount = int(layout.split('_')[1]) | ||||||
|  |     if ltype.startswith('int'): | ||||||
|  |         atype = '<i' + str(int(ltype[3:]) / 8) | ||||||
|  |     elif ltype.startswith('uint'): | ||||||
|  |         atype = '<u' + str(int(ltype[4:]) / 8) | ||||||
|  |     elif ltype.startswith('float'): | ||||||
|  |         atype = '<f' + str(int(ltype[5:]) / 8) | ||||||
|  |     else: | ||||||
|  |         raise ValueError("bad layout") | ||||||
|  |     return numpy.dtype([('timestamp', '<i8'), ('data', atype, lcount)]) | ||||||
|  |  | ||||||
|  | class NumpyClient(nilmdb.client.client.Client): | ||||||
|  |     """Subclass of nilmdb.client.Client that adds additional methods for | ||||||
|  |     extracting and inserting data via Numpy arrays.""" | ||||||
|  |  | ||||||
|  |     def _get_dtype(self, path, layout): | ||||||
|  |         if layout is None: | ||||||
|  |             streams = self.stream_list(path) | ||||||
|  |             if len(streams) != 1: | ||||||
|  |                 raise ClientError("can't get layout for path: " + path) | ||||||
|  |             layout = streams[0][1] | ||||||
|  |         return layout_to_dtype(layout) | ||||||
|  |  | ||||||
|  |     def stream_extract_numpy(self, path, start = None, end = None, | ||||||
|  |                              layout = None, maxrows = 100000, | ||||||
|  |                              structured = False): | ||||||
|  |         """ | ||||||
|  |         Extract data from a stream.  Returns a generator that yields | ||||||
|  |         Numpy arrays of up to 'maxrows' of data each. | ||||||
|  |  | ||||||
|  |         If 'layout' is None, it is read using stream_info. | ||||||
|  |  | ||||||
|  |         If 'structured' is False, all data is converted to float64 | ||||||
|  |         and returned in a flat 2D array.  Otherwise, data is returned | ||||||
|  |         as a structured dtype in a 1D array. | ||||||
|  |         """ | ||||||
|  |         dtype = self._get_dtype(path, layout) | ||||||
|  |  | ||||||
|  |         def to_numpy(data): | ||||||
|  |             a = numpy.fromstring(data, dtype) | ||||||
|  |             if structured: | ||||||
|  |                 return a | ||||||
|  |             return numpy.c_[a['timestamp'], a['data']] | ||||||
|  |  | ||||||
|  |         chunks = [] | ||||||
|  |         total_len = 0 | ||||||
|  |         maxsize = dtype.itemsize * maxrows | ||||||
|  |         for data in self.stream_extract(path, start, end, binary = True): | ||||||
|  |             # Add this block of binary data | ||||||
|  |             chunks.append(data) | ||||||
|  |             total_len += len(data) | ||||||
|  |  | ||||||
|  |             # See if we have enough to make the requested Numpy array | ||||||
|  |             while total_len >= maxsize: | ||||||
|  |                 assembled = "".join(chunks) | ||||||
|  |                 total_len -= maxsize | ||||||
|  |                 chunks = [ assembled[maxsize:] ] | ||||||
|  |                 block = assembled[:maxsize] | ||||||
|  |                 yield to_numpy(block) | ||||||
|  |  | ||||||
|  |         if total_len: | ||||||
|  |             yield to_numpy("".join(chunks)) | ||||||
|  |  | ||||||
|  |     @contextlib.contextmanager | ||||||
|  |     def stream_insert_numpy_context(self, path, start = None, end = None, | ||||||
|  |                                     layout = None): | ||||||
|  |         """Return a context manager that allows data to be efficiently | ||||||
|  |         inserted into a stream in a piecewise manner.  Data is | ||||||
|  |         provided as Numpy arrays, and is aggregated and sent to the | ||||||
|  |         server in larger or smaller chunks as necessary.  Data format | ||||||
|  |         must match the database layout for the given path. | ||||||
|  |  | ||||||
|  |         For more details, see help for | ||||||
|  |         nilmdb.client.numpyclient.StreamInserterNumpy | ||||||
|  |  | ||||||
|  |         If 'layout' is not None, use it as the layout rather than | ||||||
|  |         querying the database. | ||||||
|  |         """ | ||||||
|  |         dtype = self._get_dtype(path, layout) | ||||||
|  |         ctx = StreamInserterNumpy(self, path, start, end, dtype) | ||||||
|  |         yield ctx | ||||||
|  |         ctx.finalize() | ||||||
|  |         ctx.destroy() | ||||||
|  |  | ||||||
|  |     def stream_insert_numpy(self, path, data, start = None, end = None, | ||||||
|  |                             layout = None): | ||||||
|  |         """Insert data into a stream.  data should be a Numpy array | ||||||
|  |         which will be passed through stream_insert_numpy_context to | ||||||
|  |         break it into chunks etc.  See the help for that function | ||||||
|  |         for details.""" | ||||||
|  |         with self.stream_insert_numpy_context(path, start, end, layout) as ctx: | ||||||
|  |             if isinstance(data, numpy.ndarray): | ||||||
|  |                 ctx.insert(data) | ||||||
|  |             else: | ||||||
|  |                 for chunk in data: | ||||||
|  |                     ctx.insert(chunk) | ||||||
|  |         return ctx.last_response | ||||||
|  |  | ||||||
|  | class StreamInserterNumpy(nilmdb.client.client.StreamInserter): | ||||||
|  |     """Object returned by stream_insert_numpy_context() that manages | ||||||
|  |     the insertion of rows of data into a particular path. | ||||||
|  |  | ||||||
|  |     See help for nilmdb.client.client.StreamInserter for details. | ||||||
|  |     The only difference is that, instead of ASCII formatted data, | ||||||
|  |     this context manager can take Numpy arrays, which are either | ||||||
|  |     structured (1D with complex dtype) or flat (2D with simple dtype). | ||||||
|  |     """ | ||||||
|  |  | ||||||
|  |     # Soft limit of how many bytes to send per HTTP request. | ||||||
|  |     _max_data = 2 * 1024 * 1024 | ||||||
|  |  | ||||||
|  |     def __init__(self, client, path, start, end, dtype): | ||||||
|  |         """ | ||||||
|  |         'client' is the client object.  'path' is the database path | ||||||
|  |         to insert to.  'start' and 'end' are used for the first | ||||||
|  |         contiguous interval and may be None.  'dtype' is the Numpy | ||||||
|  |         dtype for this stream. | ||||||
|  |         """ | ||||||
|  |         super(StreamInserterNumpy, self).__init__(client, path, start, end) | ||||||
|  |         self._dtype = dtype | ||||||
|  |  | ||||||
|  |         # Max rows to send at once | ||||||
|  |         self._max_rows = self._max_data // self._dtype.itemsize | ||||||
|  |  | ||||||
|  |         # List of the current arrays we're building up to send | ||||||
|  |         self._block_arrays = [] | ||||||
|  |         self._block_rows = 0 | ||||||
|  |  | ||||||
|  |     def insert(self, array): | ||||||
|  |         """Insert Numpy data, which must match the layout type.""" | ||||||
|  |         if type(array) != numpy.ndarray: | ||||||
|  |             array = numpy.array(array) | ||||||
|  |         if array.ndim == 1: | ||||||
|  |             # Already a structured array; just verify the type | ||||||
|  |             if array.dtype != self._dtype: | ||||||
|  |                 raise ValueError("wrong dtype for 1D (structured) array") | ||||||
|  |         elif array.ndim == 2: | ||||||
|  |             # Convert to structured array | ||||||
|  |             sarray = numpy.zeros(array.shape[0], dtype=self._dtype) | ||||||
|  |             try: | ||||||
|  |                 sarray['timestamp'] = array[:,0] | ||||||
|  |                 # Need the squeeze in case sarray['data'] is 1 dimensional | ||||||
|  |                 sarray['data'] = numpy.squeeze(array[:,1:]) | ||||||
|  |             except (IndexError, ValueError): | ||||||
|  |                 raise ValueError("wrong number of fields for this data type") | ||||||
|  |             array = sarray | ||||||
|  |         else: | ||||||
|  |             raise ValueError("wrong number of dimensions in array") | ||||||
|  |  | ||||||
|  |         length = len(array) | ||||||
|  |         maxrows = self._max_rows | ||||||
|  |  | ||||||
|  |         if length == 0: | ||||||
|  |             return | ||||||
|  |         if length > maxrows: | ||||||
|  |             # This is more than twice what we wanted to send, so split | ||||||
|  |             # it up.  This is a bit inefficient, but the user really | ||||||
|  |             # shouldn't be providing this much data at once. | ||||||
|  |             for cut in range(0, length, maxrows): | ||||||
|  |                 self.insert(array[cut:(cut + maxrows)]) | ||||||
|  |             return | ||||||
|  |  | ||||||
|  |         # Add this array to our list | ||||||
|  |         self._block_arrays.append(array) | ||||||
|  |         self._block_rows += length | ||||||
|  |  | ||||||
|  |         # Send if it's too long | ||||||
|  |         if self._block_rows >= maxrows: | ||||||
|  |             self._send_block(final = False) | ||||||
|  |  | ||||||
|  |     def _send_block(self, final = False): | ||||||
|  |         """Send the data current stored up.  One row might be left | ||||||
|  |         over if we need its timestamp saved.""" | ||||||
|  |  | ||||||
|  |         # Build the full array to send | ||||||
|  |         if self._block_rows == 0: | ||||||
|  |             array = numpy.zeros(0, dtype = self._dtype) | ||||||
|  |         else: | ||||||
|  |             array = numpy.hstack(self._block_arrays) | ||||||
|  |  | ||||||
|  |         # Get starting timestamp | ||||||
|  |         start_ts = self._interval_start | ||||||
|  |         if start_ts is None: | ||||||
|  |             # Pull start from the first row | ||||||
|  |             try: | ||||||
|  |                 start_ts = array['timestamp'][0] | ||||||
|  |             except IndexError: | ||||||
|  |                 pass # no timestamp is OK, if we have no data | ||||||
|  |  | ||||||
|  |         # Get ending timestamp | ||||||
|  |         if final: | ||||||
|  |             # For a final block, the timestamp is either the | ||||||
|  |             # user-provided end, or the timestamp of the last line | ||||||
|  |             # plus epsilon. | ||||||
|  |             end_ts = self._interval_end | ||||||
|  |             if end_ts is None: | ||||||
|  |                 try: | ||||||
|  |                     end_ts = array['timestamp'][-1] | ||||||
|  |                     end_ts += nilmdb.utils.time.epsilon | ||||||
|  |                 except IndexError: | ||||||
|  |                     pass # no timestamp is OK, if we have no data | ||||||
|  |             self._block_arrays = [] | ||||||
|  |             self._block_rows = 0 | ||||||
|  |  | ||||||
|  |             # Next block is completely fresh | ||||||
|  |             self._interval_start = None | ||||||
|  |             self._interval_end = None | ||||||
|  |         else: | ||||||
|  |             # An intermediate block.  We need to save the last row | ||||||
|  |             # for the next block, and use its timestamp as the ending | ||||||
|  |             # timestamp for this one. | ||||||
|  |             if len(array) < 2: | ||||||
|  |                 # Not enough data to send an intermediate block | ||||||
|  |                 return | ||||||
|  |             end_ts = array['timestamp'][-1] | ||||||
|  |             if self._interval_end is not None and end_ts > self._interval_end: | ||||||
|  |                 # User gave us bad endpoints; send it anyway, and let | ||||||
|  |                 # the server complain so that the error is the same | ||||||
|  |                 # as if we hadn't done this chunking. | ||||||
|  |                 end_ts = self._interval_end | ||||||
|  |             self._block_arrays = [ array[-1:] ] | ||||||
|  |             self._block_rows = 1 | ||||||
|  |             array = array[:-1] | ||||||
|  |  | ||||||
|  |             # Next block continues where this one ended | ||||||
|  |             self._interval_start = end_ts | ||||||
|  |  | ||||||
|  |         # If we have no endpoints, or equal endpoints, it's OK as long | ||||||
|  |         # as there's no data to send | ||||||
|  |         if (start_ts is None or end_ts is None) or (start_ts == end_ts): | ||||||
|  |             if len(array) == 0: | ||||||
|  |                 return | ||||||
|  |             raise ClientError("have data to send, but invalid start/end times") | ||||||
|  |  | ||||||
|  |         # Send it | ||||||
|  |         data = array.tostring() | ||||||
|  |         self.last_response = self._client.stream_insert_block( | ||||||
|  |             self._path, data, start_ts, end_ts, binary = True) | ||||||
|  |  | ||||||
|  |         return | ||||||
| @@ -10,6 +10,7 @@ import sys | |||||||
| import os | import os | ||||||
| import argparse | import argparse | ||||||
| from argparse import ArgumentDefaultsHelpFormatter as def_form | from argparse import ArgumentDefaultsHelpFormatter as def_form | ||||||
|  | import signal | ||||||
|  |  | ||||||
| try: # pragma: no cover | try: # pragma: no cover | ||||||
|     import argcomplete |     import argcomplete | ||||||
| @@ -28,6 +29,14 @@ for cmd in subcommands: | |||||||
|     subcmd_mods[cmd] = __import__("nilmdb.cmdline." + cmd, fromlist = [ cmd ]) |     subcmd_mods[cmd] = __import__("nilmdb.cmdline." + cmd, fromlist = [ cmd ]) | ||||||
|  |  | ||||||
| class JimArgumentParser(argparse.ArgumentParser): | class JimArgumentParser(argparse.ArgumentParser): | ||||||
|  |     def parse_args(self, args=None, namespace=None): | ||||||
|  |         # Look for --version anywhere and change it to just "nilmtool | ||||||
|  |         # --version".  This makes "nilmtool cmd --version" work, which | ||||||
|  |         # is needed by help2man. | ||||||
|  |         if "--version" in (args or sys.argv[1:]): | ||||||
|  |             args = [ "--version" ] | ||||||
|  |         return argparse.ArgumentParser.parse_args(self, args, namespace) | ||||||
|  |  | ||||||
|     def error(self, message): |     def error(self, message): | ||||||
|         self.print_usage(sys.stderr) |         self.print_usage(sys.stderr) | ||||||
|         self.exit(2, sprintf("error: %s\n", message)) |         self.exit(2, sprintf("error: %s\n", message)) | ||||||
| @@ -71,17 +80,29 @@ class Complete(object): # pragma: no cover | |||||||
|         path = parsed_args.path |         path = parsed_args.path | ||||||
|         if not path: |         if not path: | ||||||
|             return [] |             return [] | ||||||
|         return ( self.escape(k + '=' + v) |         results = [] | ||||||
|                  for (k,v) in client.stream_get_metadata(path).iteritems() |         # prefix comes in as UTF-8, but results need to be Unicode, | ||||||
|                  if k.startswith(prefix) ) |         # weird.  Still doesn't work in all cases, but that's bugs in | ||||||
|  |         # argcomplete. | ||||||
|  |         prefix = nilmdb.utils.unicode.decode(prefix) | ||||||
|  |         for (k,v) in client.stream_get_metadata(path).iteritems(): | ||||||
|  |             kv = self.escape(k + '=' + v) | ||||||
|  |             if kv.startswith(prefix): | ||||||
|  |                 results.append(kv) | ||||||
|  |         return results | ||||||
|  |  | ||||||
| class Cmdline(object): | class Cmdline(object): | ||||||
|  |  | ||||||
|     def __init__(self, argv = None): |     def __init__(self, argv = None): | ||||||
|         self.argv = argv or sys.argv[1:] |         self.argv = argv or sys.argv[1:] | ||||||
|  |         try: | ||||||
|  |             # Assume command line arguments are encoded with stdin's encoding, | ||||||
|  |             # and reverse it.  Won't be needed in Python 3, but for now.. | ||||||
|  |             self.argv = [ x.decode(sys.stdin.encoding) for x in self.argv ] | ||||||
|  |         except Exception: # pragma: no cover | ||||||
|  |             pass | ||||||
|         self.client = None |         self.client = None | ||||||
|         self.def_url = os.environ.get("NILMDB_URL", "http://localhost:12380") |         self.def_url = os.environ.get("NILMDB_URL", "http://localhost/nilmdb/") | ||||||
|         self.subcmd = {} |         self.subcmd = {} | ||||||
|         self.complete = Complete() |         self.complete = Complete() | ||||||
|  |  | ||||||
| @@ -126,6 +147,13 @@ class Cmdline(object): | |||||||
|         sys.exit(-1) |         sys.exit(-1) | ||||||
|  |  | ||||||
|     def run(self): |     def run(self): | ||||||
|  |         # Set SIGPIPE to its default handler -- we don't need Python | ||||||
|  |         # to catch it for us. | ||||||
|  |         try: | ||||||
|  |             signal.signal(signal.SIGPIPE, signal.SIG_DFL) | ||||||
|  |         except ValueError: # pragma: no cover | ||||||
|  |             pass | ||||||
|  |  | ||||||
|         # Clear cached timezone, so that we can pick up timezone changes |         # Clear cached timezone, so that we can pick up timezone changes | ||||||
|         # while running this from the test suite. |         # while running this from the test suite. | ||||||
|         datetime_tz._localtz = None |         datetime_tz._localtz = None | ||||||
|   | |||||||
| @@ -1,5 +1,6 @@ | |||||||
| from nilmdb.utils.printf import * | from nilmdb.utils.printf import * | ||||||
| import nilmdb.client | import nilmdb.client | ||||||
|  | import fnmatch | ||||||
|  |  | ||||||
| from argparse import ArgumentDefaultsHelpFormatter as def_form | from argparse import ArgumentDefaultsHelpFormatter as def_form | ||||||
|  |  | ||||||
| @@ -7,20 +8,42 @@ def setup(self, sub): | |||||||
|     cmd = sub.add_parser("destroy", help="Delete a stream and all data", |     cmd = sub.add_parser("destroy", help="Delete a stream and all data", | ||||||
|                          formatter_class = def_form, |                          formatter_class = def_form, | ||||||
|                          description=""" |                          description=""" | ||||||
|                          Destroy the stream at the specified path.  All |                          Destroy the stream at the specified path. | ||||||
|                          data and metadata related to the stream is |                          The stream must be empty.  All metadata | ||||||
|                          permanently deleted. |                          related to the stream is permanently deleted. | ||||||
|  |  | ||||||
|  |                          Wildcards and multiple paths are supported. | ||||||
|                          """) |                          """) | ||||||
|     cmd.set_defaults(handler = cmd_destroy) |     cmd.set_defaults(handler = cmd_destroy) | ||||||
|  |     group = cmd.add_argument_group("Options") | ||||||
|  |     group.add_argument("-R", "--remove", action="store_true", | ||||||
|  |                        help="Remove all data before destroying stream") | ||||||
|  |     group.add_argument("-q", "--quiet", action="store_true", | ||||||
|  |                        help="Don't display names when destroying " | ||||||
|  |                        "multiple paths") | ||||||
|     group = cmd.add_argument_group("Required arguments") |     group = cmd.add_argument_group("Required arguments") | ||||||
|     group.add_argument("path", |     group.add_argument("path", nargs='+', | ||||||
|                        help="Path of the stream to delete, e.g. /foo/bar", |                        help="Path of the stream to delete, e.g. /foo/bar/*", | ||||||
|                        ).completer = self.complete.path |                        ).completer = self.complete.path | ||||||
|     return cmd |     return cmd | ||||||
|  |  | ||||||
| def cmd_destroy(self): | def cmd_destroy(self): | ||||||
|     """Destroy stream""" |     """Destroy stream""" | ||||||
|  |     streams = [ s[0] for s in self.client.stream_list() ] | ||||||
|  |     paths = [] | ||||||
|  |     for path in self.args.path: | ||||||
|  |         new = fnmatch.filter(streams, path) | ||||||
|  |         if not new: | ||||||
|  |             self.die("error: no stream matched path: %s", path) | ||||||
|  |         paths.extend(new) | ||||||
|  |  | ||||||
|  |     for path in paths: | ||||||
|  |         if not self.args.quiet and len(paths) > 1: | ||||||
|  |             printf("Destroying %s\n", path) | ||||||
|  |  | ||||||
|         try: |         try: | ||||||
|         self.client.stream_destroy(self.args.path) |             if self.args.remove: | ||||||
|  |                 count = self.client.stream_remove(path) | ||||||
|  |             self.client.stream_destroy(path) | ||||||
|         except nilmdb.client.ClientError as e: |         except nilmdb.client.ClientError as e: | ||||||
|             self.die("error destroying stream: %s", str(e)) |             self.die("error destroying stream: %s", str(e)) | ||||||
|   | |||||||
| @@ -1,6 +1,7 @@ | |||||||
| from __future__ import print_function | from __future__ import print_function | ||||||
| from nilmdb.utils.printf import * | from nilmdb.utils.printf import * | ||||||
| import nilmdb.client | import nilmdb.client | ||||||
|  | import sys | ||||||
|  |  | ||||||
| def setup(self, sub): | def setup(self, sub): | ||||||
|     cmd = sub.add_parser("extract", help="Extract data", |     cmd = sub.add_parser("extract", help="Extract data", | ||||||
| @@ -24,11 +25,15 @@ def setup(self, sub): | |||||||
|                        ).completer = self.complete.time |                        ).completer = self.complete.time | ||||||
|  |  | ||||||
|     group = cmd.add_argument_group("Output format") |     group = cmd.add_argument_group("Output format") | ||||||
|  |     group.add_argument("-B", "--binary", action="store_true", | ||||||
|  |                        help="Raw binary output") | ||||||
|     group.add_argument("-b", "--bare", action="store_true", |     group.add_argument("-b", "--bare", action="store_true", | ||||||
|                        help="Exclude timestamps from output lines") |                        help="Exclude timestamps from output lines") | ||||||
|     group.add_argument("-a", "--annotate", action="store_true", |     group.add_argument("-a", "--annotate", action="store_true", | ||||||
|                        help="Include comments with some information " |                        help="Include comments with some information " | ||||||
|                        "about the stream") |                        "about the stream") | ||||||
|  |     group.add_argument("-m", "--markup", action="store_true", | ||||||
|  |                        help="Include comments with interval starts and ends") | ||||||
|     group.add_argument("-T", "--timestamp-raw", action="store_true", |     group.add_argument("-T", "--timestamp-raw", action="store_true", | ||||||
|                        help="Show raw timestamps in annotated information") |                        help="Show raw timestamps in annotated information") | ||||||
|     group.add_argument("-c", "--count", action="store_true", |     group.add_argument("-c", "--count", action="store_true", | ||||||
| @@ -40,6 +45,11 @@ def cmd_extract_verify(self): | |||||||
|         if self.args.start > self.args.end: |         if self.args.start > self.args.end: | ||||||
|             self.parser.error("start is after end") |             self.parser.error("start is after end") | ||||||
|  |  | ||||||
|  |     if self.args.binary: | ||||||
|  |         if (self.args.bare or self.args.annotate or self.args.markup or | ||||||
|  |             self.args.timestamp_raw or self.args.count): | ||||||
|  |             self.parser.error("--binary cannot be combined with other options") | ||||||
|  |  | ||||||
| def cmd_extract(self): | def cmd_extract(self): | ||||||
|     streams = self.client.stream_list(self.args.path) |     streams = self.client.stream_list(self.args.path) | ||||||
|     if len(streams) != 1: |     if len(streams) != 1: | ||||||
| @@ -58,15 +68,23 @@ def cmd_extract(self): | |||||||
|         printf("# end: %s\n", time_string(self.args.end)) |         printf("# end: %s\n", time_string(self.args.end)) | ||||||
|  |  | ||||||
|     printed = False |     printed = False | ||||||
|  |     if self.args.binary: | ||||||
|  |         printer = sys.stdout.write | ||||||
|  |     else: | ||||||
|  |         printer = print | ||||||
|  |     bare = self.args.bare | ||||||
|  |     count = self.args.count | ||||||
|     for dataline in self.client.stream_extract(self.args.path, |     for dataline in self.client.stream_extract(self.args.path, | ||||||
|                                                self.args.start, |                                                self.args.start, | ||||||
|                                                self.args.end, |                                                self.args.end, | ||||||
|                                                self.args.count): |                                                self.args.count, | ||||||
|         if self.args.bare and not self.args.count: |                                                self.args.markup, | ||||||
|  |                                                self.args.binary): | ||||||
|  |         if bare and not count: | ||||||
|             # Strip timestamp (first element).  Doesn't make sense |             # Strip timestamp (first element).  Doesn't make sense | ||||||
|             # if we are only returning a count. |             # if we are only returning a count. | ||||||
|             dataline = ' '.join(dataline.split(' ')[1:]) |             dataline = ' '.join(dataline.split(' ')[1:]) | ||||||
|         print(dataline) |         printer(dataline) | ||||||
|         printed = True |         printed = True | ||||||
|     if not printed: |     if not printed: | ||||||
|         if self.args.annotate: |         if self.args.annotate: | ||||||
|   | |||||||
| @@ -21,5 +21,8 @@ def cmd_info(self): | |||||||
|     printf("Server URL: %s\n", self.client.geturl()) |     printf("Server URL: %s\n", self.client.geturl()) | ||||||
|     dbinfo = self.client.dbinfo() |     dbinfo = self.client.dbinfo() | ||||||
|     printf("Server database path: %s\n", dbinfo["path"]) |     printf("Server database path: %s\n", dbinfo["path"]) | ||||||
|     printf("Server database size: %s\n", human_size(dbinfo["size"])) |     for (desc, field) in [("used by NilmDB", "size"), | ||||||
|     printf("Server database free space: %s\n", human_size(dbinfo["free"])) |                           ("used by other", "other"), | ||||||
|  |                           ("reserved", "reserved"), | ||||||
|  |                           ("free", "free")]: | ||||||
|  |         printf("Server disk space %s: %s\n", desc, human_size(dbinfo[field])) | ||||||
|   | |||||||
| @@ -1,5 +1,6 @@ | |||||||
| from nilmdb.utils.printf import * | from nilmdb.utils.printf import * | ||||||
| import nilmdb.utils.time | import nilmdb.utils.time | ||||||
|  | from nilmdb.utils.interval import Interval | ||||||
|  |  | ||||||
| import fnmatch | import fnmatch | ||||||
| import argparse | import argparse | ||||||
| @@ -42,6 +43,8 @@ def setup(self, sub): | |||||||
|     group = cmd.add_argument_group("Misc options") |     group = cmd.add_argument_group("Misc options") | ||||||
|     group.add_argument("-T", "--timestamp-raw", action="store_true", |     group.add_argument("-T", "--timestamp-raw", action="store_true", | ||||||
|                        help="Show raw timestamps when printing times") |                        help="Show raw timestamps when printing times") | ||||||
|  |     group.add_argument("-o", "--optimize", action="store_true", | ||||||
|  |                        help="Optimize (merge adjacent) intervals") | ||||||
|  |  | ||||||
|     return cmd |     return cmd | ||||||
|  |  | ||||||
| @@ -58,9 +61,16 @@ def cmd_intervals(self): | |||||||
|         time_string = nilmdb.utils.time.timestamp_to_human |         time_string = nilmdb.utils.time.timestamp_to_human | ||||||
|  |  | ||||||
|     try: |     try: | ||||||
|            for (start, end) in self.client.stream_intervals( |         intervals = ( Interval(start, end) for (start, end) in | ||||||
|                self.args.path, self.args.start, self.args.end, self.args.diff): |                       self.client.stream_intervals(self.args.path, | ||||||
|                printf("[ %s -> %s ]\n", time_string(start), time_string(end)) |                                                    self.args.start, | ||||||
|  |                                                    self.args.end, | ||||||
|  |                                                    self.args.diff) ) | ||||||
|  |         if self.args.optimize: | ||||||
|  |             intervals = nilmdb.utils.interval.optimize(intervals) | ||||||
|  |         for i in intervals: | ||||||
|  |             printf("[ %s -> %s ]\n", time_string(i.start), time_string(i.end)) | ||||||
|  |  | ||||||
|     except nilmdb.client.ClientError as e: |     except nilmdb.client.ClientError as e: | ||||||
|         self.die("error listing intervals: %s", str(e)) |         self.die("error listing intervals: %s", str(e)) | ||||||
|  |  | ||||||
|   | |||||||
| @@ -10,22 +10,16 @@ def setup(self, sub): | |||||||
|                          formatter_class = def_form, |                          formatter_class = def_form, | ||||||
|                          description=""" |                          description=""" | ||||||
|                          List streams available in the database, |                          List streams available in the database, | ||||||
|                          optionally filtering by layout or path.  Wildcards |                          optionally filtering by path.  Wildcards | ||||||
|                          are accepted. |                          are accepted; non-matching paths or wildcards | ||||||
|  |                          are ignored. | ||||||
|                          """) |                          """) | ||||||
|     cmd.set_defaults(verify = cmd_list_verify, |     cmd.set_defaults(verify = cmd_list_verify, | ||||||
|                      handler = cmd_list) |                      handler = cmd_list) | ||||||
|  |  | ||||||
|     group = cmd.add_argument_group("Stream filtering") |     group = cmd.add_argument_group("Stream filtering") | ||||||
|     group.add_argument("-p", "--path", metavar="PATH", default="*", |     group.add_argument("path", metavar="PATH", default=["*"], nargs='*', | ||||||
|                        help="Match only this path (-p can be omitted)", |  | ||||||
|                        ).completer = self.complete.path |                        ).completer = self.complete.path | ||||||
|     group.add_argument("path_positional", default="*", |  | ||||||
|                        nargs="?", help=argparse.SUPPRESS, |  | ||||||
|                        ).completer = self.complete.path |  | ||||||
|     group.add_argument("-l", "--layout", default="*", |  | ||||||
|                        help="Match only this stream layout", |  | ||||||
|                        ).completer = self.complete.layout |  | ||||||
|  |  | ||||||
|     group = cmd.add_argument_group("Interval info") |     group = cmd.add_argument_group("Interval info") | ||||||
|     group.add_argument("-E", "--ext", action="store_true", |     group.add_argument("-E", "--ext", action="store_true", | ||||||
| @@ -49,20 +43,12 @@ def setup(self, sub): | |||||||
|     group = cmd.add_argument_group("Misc options") |     group = cmd.add_argument_group("Misc options") | ||||||
|     group.add_argument("-T", "--timestamp-raw", action="store_true", |     group.add_argument("-T", "--timestamp-raw", action="store_true", | ||||||
|                        help="Show raw timestamps when printing times") |                        help="Show raw timestamps when printing times") | ||||||
|  |     group.add_argument("-l", "--layout", action="store_true", | ||||||
|  |                        help="Show layout type next to path name") | ||||||
|  |  | ||||||
|     return cmd |     return cmd | ||||||
|  |  | ||||||
| def cmd_list_verify(self): | def cmd_list_verify(self): | ||||||
|     # A hidden "path_positional" argument lets the user leave off the |  | ||||||
|     # "-p" when specifying the path.  Handle it here. |  | ||||||
|     got_opt = self.args.path != "*" |  | ||||||
|     got_pos = self.args.path_positional != "*" |  | ||||||
|     if got_pos: |  | ||||||
|         if got_opt: |  | ||||||
|             self.parser.error("too many paths specified") |  | ||||||
|         else: |  | ||||||
|             self.args.path = self.args.path_positional |  | ||||||
|  |  | ||||||
|     if self.args.start is not None and self.args.end is not None: |     if self.args.start is not None and self.args.end is not None: | ||||||
|         if self.args.start >= self.args.end: |         if self.args.start >= self.args.end: | ||||||
|             self.parser.error("start must precede end") |             self.parser.error("start must precede end") | ||||||
| @@ -80,13 +66,16 @@ def cmd_list(self): | |||||||
|     else: |     else: | ||||||
|         time_string = nilmdb.utils.time.timestamp_to_human |         time_string = nilmdb.utils.time.timestamp_to_human | ||||||
|  |  | ||||||
|  |     for argpath in self.args.path: | ||||||
|         for stream in streams: |         for stream in streams: | ||||||
|             (path, layout, int_min, int_max, rows, time) = stream[:6] |             (path, layout, int_min, int_max, rows, time) = stream[:6] | ||||||
|         if not (fnmatch.fnmatch(path, self.args.path) and |             if not fnmatch.fnmatch(path, argpath): | ||||||
|                 fnmatch.fnmatch(layout, self.args.layout)): |  | ||||||
|                 continue |                 continue | ||||||
|  |  | ||||||
|  |             if self.args.layout: | ||||||
|                 printf("%s %s\n", path, layout) |                 printf("%s %s\n", path, layout) | ||||||
|  |             else: | ||||||
|  |                 printf("%s\n", path) | ||||||
|  |  | ||||||
|             if self.args.ext: |             if self.args.ext: | ||||||
|                 if int_min is None or int_max is None: |                 if int_min is None or int_max is None: | ||||||
| @@ -102,7 +91,8 @@ def cmd_list(self): | |||||||
|                 printed = False |                 printed = False | ||||||
|                 for (start, end) in self.client.stream_intervals( |                 for (start, end) in self.client.stream_intervals( | ||||||
|                     path, self.args.start, self.args.end): |                     path, self.args.start, self.args.end): | ||||||
|                 printf("  [ %s -> %s ]\n", time_string(start), time_string(end)) |                     printf("  [ %s -> %s ]\n", | ||||||
|  |                            time_string(start), time_string(end)) | ||||||
|                     printed = True |                     printed = True | ||||||
|                 if not printed: |                 if not printed: | ||||||
|                     printf("  (no intervals)\n") |                     printf("  (no intervals)\n") | ||||||
|   | |||||||
| @@ -9,7 +9,8 @@ def setup(self, sub): | |||||||
|                          a stream. |                          a stream. | ||||||
|                          """, |                          """, | ||||||
|                          usage="%(prog)s path [-g [key ...] | " |                          usage="%(prog)s path [-g [key ...] | " | ||||||
|                          "-s key=value [...] | -u key=value [...]]") |                          "-s key=value [...] | -u key=value [...]] | " | ||||||
|  |                          "-d [key ...]") | ||||||
|     cmd.set_defaults(handler = cmd_metadata) |     cmd.set_defaults(handler = cmd_metadata) | ||||||
|  |  | ||||||
|     group = cmd.add_argument_group("Required arguments") |     group = cmd.add_argument_group("Required arguments") | ||||||
| @@ -30,6 +31,9 @@ def setup(self, sub): | |||||||
|                      help="Update metadata using provided " |                      help="Update metadata using provided " | ||||||
|                      "key=value pairs", |                      "key=value pairs", | ||||||
|                      ).completer = self.complete.meta_keyval |                      ).completer = self.complete.meta_keyval | ||||||
|  |     exc.add_argument("-d", "--delete", nargs="*", metavar="key", | ||||||
|  |                      help="Delete metadata for specified keys (default all)", | ||||||
|  |                      ).completer = self.complete.meta_key | ||||||
|     return cmd |     return cmd | ||||||
|  |  | ||||||
| def cmd_metadata(self): | def cmd_metadata(self): | ||||||
| @@ -37,10 +41,10 @@ def cmd_metadata(self): | |||||||
|     if self.args.set is not None or self.args.update is not None: |     if self.args.set is not None or self.args.update is not None: | ||||||
|         # Either set, or update |         # Either set, or update | ||||||
|         if self.args.set is not None: |         if self.args.set is not None: | ||||||
|             keyvals = self.args.set |             keyvals = map(nilmdb.utils.unicode.decode, self.args.set) | ||||||
|             handler = self.client.stream_set_metadata |             handler = self.client.stream_set_metadata | ||||||
|         else: |         else: | ||||||
|             keyvals = self.args.update |             keyvals = map(nilmdb.utils.unicode.decode, self.args.update) | ||||||
|             handler = self.client.stream_update_metadata |             handler = self.client.stream_update_metadata | ||||||
|  |  | ||||||
|         # Extract key=value pairs |         # Extract key=value pairs | ||||||
| @@ -56,15 +60,31 @@ def cmd_metadata(self): | |||||||
|             handler(self.args.path, data) |             handler(self.args.path, data) | ||||||
|         except nilmdb.client.ClientError as e: |         except nilmdb.client.ClientError as e: | ||||||
|             self.die("error setting/updating metadata: %s", str(e)) |             self.die("error setting/updating metadata: %s", str(e)) | ||||||
|  |     elif self.args.delete is not None: | ||||||
|  |         # Delete (by setting values to empty strings) | ||||||
|  |         keys = None | ||||||
|  |         if self.args.delete: | ||||||
|  |             keys = map(nilmdb.utils.unicode.decode, self.args.delete) | ||||||
|  |         try: | ||||||
|  |             data = self.client.stream_get_metadata(self.args.path, keys) | ||||||
|  |             for key in data: | ||||||
|  |                 data[key] = "" | ||||||
|  |             self.client.stream_update_metadata(self.args.path, data) | ||||||
|  |         except nilmdb.client.ClientError as e: | ||||||
|  |             self.die("error deleting metadata: %s", str(e)) | ||||||
|     else: |     else: | ||||||
|         # Get (or unspecified) |         # Get (or unspecified) | ||||||
|         keys = self.args.get or None |         keys = None | ||||||
|  |         if self.args.get: | ||||||
|  |             keys = map(nilmdb.utils.unicode.decode, self.args.get) | ||||||
|         try: |         try: | ||||||
|             data = self.client.stream_get_metadata(self.args.path, keys) |             data = self.client.stream_get_metadata(self.args.path, keys) | ||||||
|         except nilmdb.client.ClientError as e: |         except nilmdb.client.ClientError as e: | ||||||
|             self.die("error getting metadata: %s", str(e)) |             self.die("error getting metadata: %s", str(e)) | ||||||
|         for key, value in sorted(data.items()): |         for key, value in sorted(data.items()): | ||||||
|             # Omit nonexistant keys |             # Print nonexistant keys as having empty value | ||||||
|             if value is None: |             if value is None: | ||||||
|                 value = "" |                 value = "" | ||||||
|             printf("%s=%s\n", key, value) |             printf("%s=%s\n", | ||||||
|  |                    nilmdb.utils.unicode.encode(key), | ||||||
|  |                    nilmdb.utils.unicode.encode(value)) | ||||||
|   | |||||||
| @@ -1,17 +1,19 @@ | |||||||
| from nilmdb.utils.printf import * | from nilmdb.utils.printf import * | ||||||
| import nilmdb.client | import nilmdb.client | ||||||
|  | import fnmatch | ||||||
|  |  | ||||||
| def setup(self, sub): | def setup(self, sub): | ||||||
|     cmd = sub.add_parser("remove", help="Remove data", |     cmd = sub.add_parser("remove", help="Remove data", | ||||||
|                          description=""" |                          description=""" | ||||||
|                          Remove all data from a specified time range within a |                          Remove all data from a specified time range within a | ||||||
|                          stream. |                          stream.  If multiple streams or wildcards are provided, | ||||||
|  |                          the same time range is removed from all streams. | ||||||
|                          """) |                          """) | ||||||
|     cmd.set_defaults(handler = cmd_remove) |     cmd.set_defaults(handler = cmd_remove) | ||||||
|  |  | ||||||
|     group = cmd.add_argument_group("Data selection") |     group = cmd.add_argument_group("Data selection") | ||||||
|     group.add_argument("path", |     group.add_argument("path", nargs='+', | ||||||
|                        help="Path of stream, e.g. /foo/bar", |                        help="Path of stream, e.g. /foo/bar/*", | ||||||
|                        ).completer = self.complete.path |                        ).completer = self.complete.path | ||||||
|     group.add_argument("-s", "--start", required=True, |     group.add_argument("-s", "--start", required=True, | ||||||
|                        metavar="TIME", type=self.arg_time, |                        metavar="TIME", type=self.arg_time, | ||||||
| @@ -23,18 +25,31 @@ def setup(self, sub): | |||||||
|                        ).completer = self.complete.time |                        ).completer = self.complete.time | ||||||
|  |  | ||||||
|     group = cmd.add_argument_group("Output format") |     group = cmd.add_argument_group("Output format") | ||||||
|  |     group.add_argument("-q", "--quiet", action="store_true", | ||||||
|  |                        help="Don't display names when removing " | ||||||
|  |                        "from multiple paths") | ||||||
|     group.add_argument("-c", "--count", action="store_true", |     group.add_argument("-c", "--count", action="store_true", | ||||||
|                        help="Output number of data points removed") |                        help="Output number of data points removed") | ||||||
|     return cmd |     return cmd | ||||||
|  |  | ||||||
| def cmd_remove(self): | def cmd_remove(self): | ||||||
|  |     streams = [ s[0] for s in self.client.stream_list() ] | ||||||
|  |     paths = [] | ||||||
|  |     for path in self.args.path: | ||||||
|  |         new = fnmatch.filter(streams, path) | ||||||
|  |         if not new: | ||||||
|  |             self.die("error: no stream matched path: %s", path) | ||||||
|  |         paths.extend(new) | ||||||
|  |  | ||||||
|     try: |     try: | ||||||
|         count = self.client.stream_remove(self.args.path, |         for path in paths: | ||||||
|  |             if not self.args.quiet and len(paths) > 1: | ||||||
|  |                 printf("Removing from %s\n", path) | ||||||
|  |             count = self.client.stream_remove(path, | ||||||
|                                               self.args.start, self.args.end) |                                               self.args.start, self.args.end) | ||||||
|  |             if self.args.count: | ||||||
|  |                 printf("%d\n", count); | ||||||
|     except nilmdb.client.ClientError as e: |     except nilmdb.client.ClientError as e: | ||||||
|         self.die("error removing data: %s", str(e)) |         self.die("error removing data: %s", str(e)) | ||||||
|  |  | ||||||
|     if self.args.count: |  | ||||||
|         printf("%d\n", count) |  | ||||||
|  |  | ||||||
|     return 0 |     return 0 | ||||||
|   | |||||||
							
								
								
									
										5
									
								
								nilmdb/fsck/__init__.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										5
									
								
								nilmdb/fsck/__init__.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,5 @@ | |||||||
|  | """nilmdb.fsck""" | ||||||
|  |  | ||||||
|  | from __future__ import absolute_import | ||||||
|  |  | ||||||
|  | from nilmdb.fsck.fsck import Fsck | ||||||
							
								
								
									
										450
									
								
								nilmdb/fsck/fsck.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										450
									
								
								nilmdb/fsck/fsck.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,450 @@ | |||||||
|  | # -*- coding: utf-8 -*- | ||||||
|  |  | ||||||
|  | """Check database consistency, with some ability to fix problems. | ||||||
|  | This should be able to fix cases where a database gets corrupted due | ||||||
|  | to unexpected system shutdown, and detect other cases that may cause | ||||||
|  | NilmDB to return errors when trying to manipulate the database.""" | ||||||
|  |  | ||||||
|  | import nilmdb.utils | ||||||
|  | import nilmdb.server | ||||||
|  | import nilmdb.client.numpyclient | ||||||
|  | from nilmdb.utils.interval import IntervalError | ||||||
|  | from nilmdb.server.interval import Interval, IntervalSet | ||||||
|  | from nilmdb.utils.printf import * | ||||||
|  | from nilmdb.utils.time import timestamp_to_string | ||||||
|  |  | ||||||
|  | from collections import defaultdict | ||||||
|  | import sqlite3 | ||||||
|  | import os | ||||||
|  | import sys | ||||||
|  | import progressbar | ||||||
|  | import re | ||||||
|  | import time | ||||||
|  | import shutil | ||||||
|  | import cPickle as pickle | ||||||
|  | import numpy | ||||||
|  |  | ||||||
|  | class FsckError(Exception): | ||||||
|  |     def __init__(self, msg = "", *args): | ||||||
|  |         if args: | ||||||
|  |             msg = sprintf(msg, *args) | ||||||
|  |         Exception.__init__(self, msg) | ||||||
|  | class FixableFsckError(FsckError): | ||||||
|  |     def __init__(self, msg = "", *args): | ||||||
|  |         if args: | ||||||
|  |             msg = sprintf(msg, *args) | ||||||
|  |         FsckError.__init__(self, "%s\nThis may be fixable with \"--fix\".", msg) | ||||||
|  | class RetryFsck(FsckError): | ||||||
|  |     pass | ||||||
|  |  | ||||||
|  | def log(format, *args): | ||||||
|  |     printf(format, *args) | ||||||
|  |  | ||||||
|  | def err(format, *args): | ||||||
|  |     fprintf(sys.stderr, format, *args) | ||||||
|  |  | ||||||
|  | # Decorator that retries a function if it returns a specific value | ||||||
|  | def retry_if_raised(exc, message = None): | ||||||
|  |     def f1(func): | ||||||
|  |         def f2(*args, **kwargs): | ||||||
|  |             while True: | ||||||
|  |                 try: | ||||||
|  |                     return func(*args, **kwargs) | ||||||
|  |                 except exc as e: | ||||||
|  |                     if message: | ||||||
|  |                         log("%s\n\n", message) | ||||||
|  |         return f2 | ||||||
|  |     return f1 | ||||||
|  |  | ||||||
|  | class Progress(object): | ||||||
|  |     def __init__(self, maxval): | ||||||
|  |         self.bar = progressbar.ProgressBar( | ||||||
|  |             maxval = maxval, | ||||||
|  |             widgets = [ progressbar.Percentage(), ' ', | ||||||
|  |                         progressbar.Bar(), ' ', | ||||||
|  |                         progressbar.ETA() ]) | ||||||
|  |         if self.bar.term_width == 0: | ||||||
|  |             self.bar.term_width = 75 | ||||||
|  |     def __enter__(self): | ||||||
|  |         self.bar.start() | ||||||
|  |         self.last_update = 0 | ||||||
|  |         return self | ||||||
|  |     def __exit__(self, exc_type, exc_value, traceback): | ||||||
|  |         if exc_type is None: | ||||||
|  |             self.bar.finish() | ||||||
|  |         else: | ||||||
|  |             printf("\n") | ||||||
|  |     def update(self, val): | ||||||
|  |         self.bar.update(val) | ||||||
|  |  | ||||||
|  | class Fsck(object): | ||||||
|  |  | ||||||
|  |     def __init__(self, path, fix = False): | ||||||
|  |         self.basepath = path | ||||||
|  |         self.sqlpath = os.path.join(path, "data.sql") | ||||||
|  |         self.bulkpath = os.path.join(path, "data") | ||||||
|  |         self.bulklock = os.path.join(path, "data.lock") | ||||||
|  |         self.fix = fix | ||||||
|  |  | ||||||
|  |     ### Main checks | ||||||
|  |  | ||||||
|  |     @retry_if_raised(RetryFsck, "Something was fixed: restarting fsck") | ||||||
|  |     def check(self): | ||||||
|  |         self.bulk = None | ||||||
|  |         self.sql = None | ||||||
|  |         try: | ||||||
|  |             self.check_paths() | ||||||
|  |             self.check_sql() | ||||||
|  |             self.check_streams() | ||||||
|  |             self.check_intervals() | ||||||
|  |             self.check_data() | ||||||
|  |         finally: | ||||||
|  |             if self.bulk: | ||||||
|  |                 self.bulk.close() | ||||||
|  |             if self.sql: | ||||||
|  |                 self.sql.commit() | ||||||
|  |                 self.sql.close() | ||||||
|  |         log("ok\n") | ||||||
|  |  | ||||||
|  |     ### Check basic path structure | ||||||
|  |  | ||||||
|  |     def check_paths(self): | ||||||
|  |         log("checking paths\n") | ||||||
|  |         if self.bulk: | ||||||
|  |             self.bulk.close() | ||||||
|  |         if not os.path.isfile(self.sqlpath): | ||||||
|  |             raise FsckError("SQL database missing (%s)", self.sqlpath) | ||||||
|  |         if not os.path.isdir(self.bulkpath): | ||||||
|  |             raise FsckError("Bulk data directory missing (%s)", self.bulkpath) | ||||||
|  |         with open(self.bulklock, "w") as lockfile: | ||||||
|  |             if not nilmdb.utils.lock.exclusive_lock(lockfile): | ||||||
|  |                 raise FsckError('database already locked by another process') | ||||||
|  |             # unlocked immediately | ||||||
|  |         self.bulk = nilmdb.server.bulkdata.BulkData(self.basepath) | ||||||
|  |  | ||||||
|  |     ### Check SQL database health | ||||||
|  |  | ||||||
|  |     def check_sql(self): | ||||||
|  |         log("checking sqlite database\n") | ||||||
|  |  | ||||||
|  |         self.sql = sqlite3.connect(self.sqlpath) | ||||||
|  |         with self.sql: | ||||||
|  |             cur = self.sql.cursor() | ||||||
|  |             ver = cur.execute("PRAGMA user_version").fetchone()[0] | ||||||
|  |             good = max(nilmdb.server.nilmdb._sql_schema_updates.keys()) | ||||||
|  |             if ver != good: | ||||||
|  |                 raise FsckError("database version %d too old, should be %d", | ||||||
|  |                                 ver, good) | ||||||
|  |             self.stream_path = {} | ||||||
|  |             self.stream_layout = {} | ||||||
|  |             log("  loading paths\n") | ||||||
|  |             result = cur.execute("SELECT id, path, layout FROM streams") | ||||||
|  |             for r in result: | ||||||
|  |                 if r[0] in self.stream_path: | ||||||
|  |                     raise FsckError("duplicated ID %d in stream IDs", r[0]) | ||||||
|  |                 self.stream_path[r[0]] = r[1] | ||||||
|  |                 self.stream_layout[r[0]] = r[2] | ||||||
|  |  | ||||||
|  |             log("  loading intervals\n") | ||||||
|  |             self.stream_interval = defaultdict(list) | ||||||
|  |             result = cur.execute("SELECT stream_id, start_time, end_time, " | ||||||
|  |                                  "start_pos, end_pos FROM ranges " | ||||||
|  |                                  "ORDER BY start_time") | ||||||
|  |             for r in result: | ||||||
|  |                 if r[0] not in self.stream_path: | ||||||
|  |                     raise FsckError("interval ID %d not in streams", k) | ||||||
|  |                 self.stream_interval[r[0]].append((r[1], r[2], r[3], r[4])) | ||||||
|  |  | ||||||
|  |             log("  loading metadata\n") | ||||||
|  |             self.stream_meta = defaultdict(dict) | ||||||
|  |             result = cur.execute("SELECT stream_id, key, value FROM metadata") | ||||||
|  |             for r in result: | ||||||
|  |                 if r[0] not in self.stream_path: | ||||||
|  |                     raise FsckError("metadata ID %d not in streams", k) | ||||||
|  |                 if r[1] in self.stream_meta[r[0]]: | ||||||
|  |                     raise FsckError("duplicate metadata key '%s' for stream %d", | ||||||
|  |                                     r[1], r[0]) | ||||||
|  |                 self.stream_meta[r[0]][r[1]] = r[2] | ||||||
|  |  | ||||||
|  |     ### Check streams and basic interval overlap | ||||||
|  |  | ||||||
|  |     def check_streams(self): | ||||||
|  |         ids = self.stream_path.keys() | ||||||
|  |         log("checking %d streams\n", len(ids)) | ||||||
|  |         with Progress(len(ids)) as pbar: | ||||||
|  |             for i, sid in enumerate(ids): | ||||||
|  |                 pbar.update(i) | ||||||
|  |                 path = self.stream_path[sid] | ||||||
|  |  | ||||||
|  |                 # unique path, valid layout | ||||||
|  |                 if self.stream_path.values().count(path) != 1: | ||||||
|  |                     raise FsckError("duplicated path %s", path) | ||||||
|  |                 layout = self.stream_layout[sid].split('_')[0] | ||||||
|  |                 if layout not in ('int8', 'int16', 'int32', 'int64', | ||||||
|  |                                   'uint8', 'uint16', 'uint32', 'uint64', | ||||||
|  |                                   'float32', 'float64'): | ||||||
|  |                     raise FsckError("bad layout %s for %s", layout, path) | ||||||
|  |                 count = int(self.stream_layout[sid].split('_')[1]) | ||||||
|  |                 if count < 1 or count > 1024: | ||||||
|  |                     raise FsckError("bad count %d for %s", count, path) | ||||||
|  |  | ||||||
|  |                 # must exist in bulkdata | ||||||
|  |                 bulk = self.bulkpath + path | ||||||
|  |                 if not os.path.isdir(bulk): | ||||||
|  |                     raise FsckError("%s: missing bulkdata dir", path) | ||||||
|  |                 if not nilmdb.server.bulkdata.Table.exists(bulk): | ||||||
|  |                     raise FsckError("%s: bad bulkdata table", path) | ||||||
|  |  | ||||||
|  |                 # intervals don't overlap.  Abuse IntervalSet to check | ||||||
|  |                 # for intervals in file positions, too. | ||||||
|  |                 timeiset = IntervalSet() | ||||||
|  |                 posiset = IntervalSet() | ||||||
|  |                 for (stime, etime, spos, epos) in self.stream_interval[sid]: | ||||||
|  |                     new = Interval(stime, etime) | ||||||
|  |                     try: | ||||||
|  |                         timeiset += new | ||||||
|  |                     except IntervalError: | ||||||
|  |                         raise FsckError("%s: overlap in intervals:\n" | ||||||
|  |                                         "set: %s\nnew: %s", | ||||||
|  |                                         path, str(timeiset), str(new)) | ||||||
|  |                     if spos != epos: | ||||||
|  |                         new = Interval(spos, epos) | ||||||
|  |                         try: | ||||||
|  |                             posiset += new | ||||||
|  |                         except IntervalError: | ||||||
|  |                             raise FsckError("%s: overlap in file offsets:\n" | ||||||
|  |                                             "set: %s\nnew: %s", | ||||||
|  |                                             path, str(posiset), str(new)) | ||||||
|  |  | ||||||
|  |                 # check bulkdata | ||||||
|  |                 self.check_bulkdata(sid, path, bulk) | ||||||
|  |  | ||||||
|  |                 # Check that we can open bulkdata | ||||||
|  |                 try: | ||||||
|  |                     tab = None | ||||||
|  |                     try: | ||||||
|  |                         tab = nilmdb.server.bulkdata.Table(bulk) | ||||||
|  |                     except Exception as e: | ||||||
|  |                         raise FsckError("%s: can't open bulkdata: %s", | ||||||
|  |                                         path, str(e)) | ||||||
|  |                 finally: | ||||||
|  |                     if tab: | ||||||
|  |                         tab.close() | ||||||
|  |  | ||||||
|  |     ### Check that bulkdata is good enough to be opened | ||||||
|  |  | ||||||
|  |     @retry_if_raised(RetryFsck) | ||||||
|  |     def check_bulkdata(self, sid, path, bulk): | ||||||
|  |         with open(os.path.join(bulk, "_format"), "rb") as f: | ||||||
|  |             fmt = pickle.load(f) | ||||||
|  |         if fmt["version"] != 3: | ||||||
|  |             raise FsckError("%s: bad or unsupported bulkdata version %d", | ||||||
|  |                             path, fmt["version"]) | ||||||
|  |         row_per_file = int(fmt["rows_per_file"]) | ||||||
|  |         files_per_dir = int(fmt["files_per_dir"]) | ||||||
|  |         layout = fmt["layout"] | ||||||
|  |         if layout != self.stream_layout[sid]: | ||||||
|  |             raise FsckError("%s: layout mismatch %s != %s", path, | ||||||
|  |                             layout, self.stream_layout[sid]) | ||||||
|  |  | ||||||
|  |         # Every file should have a size that's the multiple of the row size | ||||||
|  |         rkt = nilmdb.server.rocket.Rocket(layout, None) | ||||||
|  |         row_size = rkt.binary_size | ||||||
|  |         rkt.close() | ||||||
|  |  | ||||||
|  |         # Find all directories | ||||||
|  |         regex = re.compile("^[0-9a-f]{4,}$") | ||||||
|  |         subdirs = sorted(filter(regex.search, os.listdir(bulk)), | ||||||
|  |                          key = lambda x: int(x, 16), reverse = True) | ||||||
|  |         for subdir in subdirs: | ||||||
|  |             # Find all files in that dir | ||||||
|  |             subpath = os.path.join(bulk, subdir) | ||||||
|  |             files = filter(regex.search, os.listdir(subpath)) | ||||||
|  |             if not files: | ||||||
|  |                 self.fix_empty_subdir(subpath) | ||||||
|  |                 raise RetryFsck | ||||||
|  |             # Verify that their size is a multiple of the row size | ||||||
|  |             for filename in files: | ||||||
|  |                 filepath = os.path.join(subpath, filename) | ||||||
|  |                 offset = os.path.getsize(filepath) | ||||||
|  |                 if offset % row_size: | ||||||
|  |                     self.fix_bad_filesize(path, filepath, offset, row_size) | ||||||
|  |  | ||||||
|  |     def fix_empty_subdir(self, subpath): | ||||||
|  |         msg = sprintf("bulkdata path %s is missing data files", subpath) | ||||||
|  |         if not self.fix: | ||||||
|  |             raise FixableFsckError(msg) | ||||||
|  |         # Try to fix it by just deleting whatever is present, | ||||||
|  |         # as long as it's only ".removed" files. | ||||||
|  |         err("\n%s\n", msg) | ||||||
|  |         for fn in os.listdir(subpath): | ||||||
|  |             if not fn.endswith(".removed"): | ||||||
|  |                 raise FsckError("can't fix automatically: please manually " | ||||||
|  |                                 "remove the file %s and try again", | ||||||
|  |                                 os.path.join(subpath, fn)) | ||||||
|  |         # Remove the whole thing | ||||||
|  |         err("Removing empty subpath\n") | ||||||
|  |         shutil.rmtree(subpath) | ||||||
|  |         raise RetryFsck | ||||||
|  |  | ||||||
|  |     def fix_bad_filesize(self, path, filepath, offset, row_size): | ||||||
|  |         extra = offset % row_size | ||||||
|  |         msg = sprintf("%s: size of file %s (%d) is not a multiple" + | ||||||
|  |                       " of row size (%d): %d extra bytes present", | ||||||
|  |                       path, filepath, offset, row_size, extra) | ||||||
|  |         if not self.fix: | ||||||
|  |             raise FixableFsckError(msg) | ||||||
|  |         # Try to fix it by just truncating the file | ||||||
|  |         err("\n%s\n", msg) | ||||||
|  |         newsize = offset - extra | ||||||
|  |         err("Truncating file to %d bytes and retrying\n", newsize) | ||||||
|  |         with open(filepath, "r+b") as f: | ||||||
|  |             f.truncate(newsize) | ||||||
|  |             raise RetryFsck | ||||||
|  |  | ||||||
|  |     ### Check interval endpoints | ||||||
|  |  | ||||||
|  |     def check_intervals(self): | ||||||
|  |         total_ints = sum(len(x) for x in self.stream_interval.values()) | ||||||
|  |         log("checking %d intervals\n", total_ints) | ||||||
|  |         done = 0 | ||||||
|  |         with Progress(total_ints) as pbar: | ||||||
|  |             for sid in self.stream_interval: | ||||||
|  |                 try: | ||||||
|  |                     bulk = self.bulkpath + self.stream_path[sid] | ||||||
|  |                     tab = nilmdb.server.bulkdata.Table(bulk) | ||||||
|  |                     def update(x): | ||||||
|  |                         pbar.update(done + x) | ||||||
|  |                     ints = self.stream_interval[sid] | ||||||
|  |                     done += self.check_table_intervals(sid, ints, tab, update) | ||||||
|  |                 finally: | ||||||
|  |                     tab.close() | ||||||
|  |  | ||||||
|  |     def check_table_intervals(self, sid, ints, tab, update): | ||||||
|  |         # look in the table to make sure we can pick out the interval's | ||||||
|  |         # endpoints | ||||||
|  |         path = self.stream_path[sid] | ||||||
|  |         tab.file_open.cache_remove_all() | ||||||
|  |         for (i, intv) in enumerate(ints): | ||||||
|  |             update(i) | ||||||
|  |             (stime, etime, spos, epos) = intv | ||||||
|  |             if spos == epos and spos >= 0 and spos <= tab.nrows: | ||||||
|  |                 continue | ||||||
|  |             try: | ||||||
|  |                 srow = tab[spos] | ||||||
|  |                 erow = tab[epos-1] | ||||||
|  |             except Exception as e: | ||||||
|  |                 self.fix_bad_interval(sid, intv, tab, str(e)) | ||||||
|  |                 raise RetryFsck | ||||||
|  |         return len(ints) | ||||||
|  |  | ||||||
|  |     def fix_bad_interval(self, sid, intv, tab, msg): | ||||||
|  |         path = self.stream_path[sid] | ||||||
|  |         msg = sprintf("%s: interval %s error accessing rows: %s", | ||||||
|  |                       path, str(intv), str(msg)) | ||||||
|  |         if not self.fix: | ||||||
|  |             raise FixableFsckError(msg) | ||||||
|  |         err("\n%s\n", msg) | ||||||
|  |  | ||||||
|  |         (stime, etime, spos, epos) = intv | ||||||
|  |         # If it's just that the end pos is more than the number of rows | ||||||
|  |         # in the table, lower end pos and truncate interval time too. | ||||||
|  |         if spos < tab.nrows and epos >= tab.nrows: | ||||||
|  |             err("end position is past endrows, but it can be truncated\n") | ||||||
|  |             err("old end: time %d, pos %d\n", etime, epos) | ||||||
|  |             new_epos = tab.nrows | ||||||
|  |             new_etime = tab[new_epos-1] + 1 | ||||||
|  |             err("new end: time %d, pos %d\n", new_etime, new_epos) | ||||||
|  |             if stime < new_etime: | ||||||
|  |                 # Change it in SQL | ||||||
|  |                 with self.sql: | ||||||
|  |                     cur = self.sql.cursor() | ||||||
|  |                     cur.execute("UPDATE ranges SET end_time=?, end_pos=? " | ||||||
|  |                                 "WHERE stream_id=? AND start_time=? AND " | ||||||
|  |                                 "end_time=? AND start_pos=? AND end_pos=?", | ||||||
|  |                                 (new_etime, new_epos, sid, stime, etime, | ||||||
|  |                                  spos, epos)) | ||||||
|  |                     if cur.rowcount != 1: | ||||||
|  |                         raise FsckError("failed to fix SQL database") | ||||||
|  |                 raise RetryFsck | ||||||
|  |             err("actually it can't be truncated; times are bad too") | ||||||
|  |  | ||||||
|  |         # Otherwise, the only hope is to delete the interval entirely. | ||||||
|  |         err("*** Deleting the entire interval from SQL.\n") | ||||||
|  |         err("This may leave stale data on disk.  To fix that, copy all\n") | ||||||
|  |         err("data from this stream to a new stream, then remove all data\n") | ||||||
|  |         err("from and destroy %s.\n") | ||||||
|  |         with self.sql: | ||||||
|  |             cur = self.sql.cursor() | ||||||
|  |             cur.execute("DELETE FROM ranges WHERE " | ||||||
|  |                         "stream_id=? AND start_time=? AND " | ||||||
|  |                         "end_time=? AND start_pos=? AND end_pos=?", | ||||||
|  |                         (sid, stime, etime, spos, epos)) | ||||||
|  |             if cur.rowcount != 1: | ||||||
|  |                 raise FsckError("failed to remove interval") | ||||||
|  |         raise RetryFsck | ||||||
|  |  | ||||||
|  |     ### Check data in each interval | ||||||
|  |  | ||||||
|  |     def check_data(self): | ||||||
|  |         total_rows = sum(sum((y[3] - y[2]) for y in x) | ||||||
|  |                          for x in self.stream_interval.values()) | ||||||
|  |         log("checking %d rows of data\n", total_rows) | ||||||
|  |         done = 0 | ||||||
|  |         with Progress(total_rows) as pbar: | ||||||
|  |             for sid in self.stream_interval: | ||||||
|  |                 try: | ||||||
|  |                     bulk = self.bulkpath + self.stream_path[sid] | ||||||
|  |                     tab = nilmdb.server.bulkdata.Table(bulk) | ||||||
|  |                     def update(x): | ||||||
|  |                         pbar.update(done + x) | ||||||
|  |                     ints = self.stream_interval[sid] | ||||||
|  |                     done += self.check_table_data(sid, ints, tab, update) | ||||||
|  |                 finally: | ||||||
|  |                     tab.close() | ||||||
|  |  | ||||||
|  |     def check_table_data(self, sid, ints, tab, update): | ||||||
|  |         # Pull out all of the interval's data and verify that it's | ||||||
|  |         # monotonic. | ||||||
|  |         maxrows = 100000 | ||||||
|  |         path = self.stream_path[sid] | ||||||
|  |         layout = self.stream_layout[sid] | ||||||
|  |         dtype = nilmdb.client.numpyclient.layout_to_dtype(layout) | ||||||
|  |         tab.file_open.cache_remove_all() | ||||||
|  |         done = 0 | ||||||
|  |         for intv in ints: | ||||||
|  |             last_ts = None | ||||||
|  |             (stime, etime, spos, epos) = intv | ||||||
|  |             if spos == epos: | ||||||
|  |                 continue | ||||||
|  |             for start in xrange(*slice(spos, epos, maxrows).indices(epos)): | ||||||
|  |                 stop = min(start + maxrows, epos) | ||||||
|  |                 count = stop - start | ||||||
|  |                 # Get raw data, convert to NumPy arary | ||||||
|  |                 try: | ||||||
|  |                     raw = tab.get_data(start, stop, binary = True) | ||||||
|  |                     data = numpy.fromstring(raw, dtype) | ||||||
|  |                 except Exception as e: | ||||||
|  |                     raise FsckError("%s: failed to grab rows %d through %d: %s", | ||||||
|  |                                     path, start, stop, repr(e)) | ||||||
|  |  | ||||||
|  |                 # Verify that timestamps are monotonic | ||||||
|  |                 if (numpy.diff(data['timestamp']) <= 0).any(): | ||||||
|  |                     raise FsckError("%s: non-monotonic timestamp(s) in rows " | ||||||
|  |                                     "%d through %d", path, start, stop) | ||||||
|  |                 first_ts = data['timestamp'][0] | ||||||
|  |                 if last_ts is not None and first_ts <= last_ts: | ||||||
|  |                     raise FsckError("%s: first interval timestamp %d is not " | ||||||
|  |                                     "greater than the previous last interval " | ||||||
|  |                                     "timestamp %d, at row %d", | ||||||
|  |                                     path, first_ts, last_ts, start) | ||||||
|  |                 last_ts = data['timestamp'][-1] | ||||||
|  |  | ||||||
|  |                 # These are probably fixable, by removing the offending | ||||||
|  |                 # intervals.  But I'm not going to bother implementing | ||||||
|  |                 # that yet. | ||||||
|  |  | ||||||
|  |                 # Done | ||||||
|  |                 done += count | ||||||
|  |                 update(done) | ||||||
|  |         return done | ||||||
							
								
								
									
										25
									
								
								nilmdb/scripts/nilmdb_fsck.py
									
									
									
									
									
										Executable file
									
								
							
							
						
						
									
										25
									
								
								nilmdb/scripts/nilmdb_fsck.py
									
									
									
									
									
										Executable file
									
								
							| @@ -0,0 +1,25 @@ | |||||||
|  | #!/usr/bin/python | ||||||
|  |  | ||||||
|  | import nilmdb.fsck | ||||||
|  | import argparse | ||||||
|  | import os | ||||||
|  | import sys | ||||||
|  |  | ||||||
|  | def main(): | ||||||
|  |     """Main entry point for the 'nilmdb-fsck' command line script""" | ||||||
|  |  | ||||||
|  |     parser = argparse.ArgumentParser( | ||||||
|  |         description = 'Check database consistency', | ||||||
|  |         formatter_class = argparse.ArgumentDefaultsHelpFormatter) | ||||||
|  |     parser.add_argument("-V", "--version", action="version", | ||||||
|  |                         version = nilmdb.__version__) | ||||||
|  |     parser.add_argument("-f", "--fix", action="store_true", | ||||||
|  |                         default=False, help = 'Fix errors when possible ' | ||||||
|  |                         '(which may involve removing data)') | ||||||
|  |     parser.add_argument('database', help = 'Database directory') | ||||||
|  |     args = parser.parse_args() | ||||||
|  |  | ||||||
|  |     nilmdb.fsck.Fsck(args.database, args.fix).check() | ||||||
|  |  | ||||||
|  | if __name__ == "__main__": | ||||||
|  |     main() | ||||||
| @@ -22,7 +22,7 @@ def main(): | |||||||
|     group.add_argument('-p', '--port', help = 'Listen on the given port', |     group.add_argument('-p', '--port', help = 'Listen on the given port', | ||||||
|                        type = int, default = 12380) |                        type = int, default = 12380) | ||||||
|     group.add_argument('-d', '--database', help = 'Database directory', |     group.add_argument('-d', '--database', help = 'Database directory', | ||||||
|                        default = os.path.join(os.getcwd(), "db")) |                        default = "./db") | ||||||
|     group.add_argument('-q', '--quiet', help = 'Silence output', |     group.add_argument('-q', '--quiet', help = 'Silence output', | ||||||
|                        action = 'store_true') |                        action = 'store_true') | ||||||
|     group.add_argument('-t', '--traceback', |     group.add_argument('-t', '--traceback', | ||||||
|   | |||||||
| @@ -17,5 +17,5 @@ except (ImportError, TypeError): # pragma: no cover | |||||||
|     pass |     pass | ||||||
|  |  | ||||||
| from nilmdb.server.nilmdb import NilmDB | from nilmdb.server.nilmdb import NilmDB | ||||||
| from nilmdb.server.server import Server | from nilmdb.server.server import Server, wsgi_application | ||||||
| from nilmdb.server.errors import NilmDBError, StreamError, OverlapError | from nilmdb.server.errors import NilmDBError, StreamError, OverlapError | ||||||
|   | |||||||
| @@ -14,18 +14,21 @@ import re | |||||||
| import sys | import sys | ||||||
| import tempfile | import tempfile | ||||||
|  |  | ||||||
|  | import nilmdb.utils.lock | ||||||
| from . import rocket | from . import rocket | ||||||
|  |  | ||||||
| # Up to 256 open file descriptors at any given time. | # Up to 256 open file descriptors at any given time. | ||||||
| # These variables are global so they can be used in the decorator arguments. | # These variables are global so they can be used in the decorator arguments. | ||||||
| table_cache_size = 16 | table_cache_size = 32 | ||||||
| fd_cache_size = 16 | fd_cache_size = 8 | ||||||
|  |  | ||||||
| @nilmdb.utils.must_close(wrap_verify = False) | @nilmdb.utils.must_close(wrap_verify = False) | ||||||
| class BulkData(object): | class BulkData(object): | ||||||
|     def __init__(self, basepath, **kwargs): |     def __init__(self, basepath, **kwargs): | ||||||
|         self.basepath = basepath |         self.basepath = basepath | ||||||
|         self.root = os.path.join(self.basepath, "data") |         self.root = os.path.join(self.basepath, "data") | ||||||
|  |         self.lock = self.root + ".lock" | ||||||
|  |         self.lockfile = None | ||||||
|  |  | ||||||
|         # Tuneables |         # Tuneables | ||||||
|         if "file_size" in kwargs: |         if "file_size" in kwargs: | ||||||
| @@ -44,8 +47,22 @@ class BulkData(object): | |||||||
|         if not os.path.isdir(self.root): |         if not os.path.isdir(self.root): | ||||||
|             os.mkdir(self.root) |             os.mkdir(self.root) | ||||||
|  |  | ||||||
|  |         # Create the lock | ||||||
|  |         self.lockfile = open(self.lock, "w") | ||||||
|  |         if not nilmdb.utils.lock.exclusive_lock(self.lockfile): | ||||||
|  |             raise IOError('database at "' + self.basepath + | ||||||
|  |                           '" is already locked by another process') | ||||||
|  |  | ||||||
|     def close(self): |     def close(self): | ||||||
|         self.getnode.cache_remove_all() |         self.getnode.cache_remove_all() | ||||||
|  |         if self.lockfile: | ||||||
|  |             nilmdb.utils.lock.exclusive_unlock(self.lockfile) | ||||||
|  |             self.lockfile.close() | ||||||
|  |             try: | ||||||
|  |                 os.unlink(self.lock) | ||||||
|  |             except OSError: # pragma: no cover | ||||||
|  |                 pass | ||||||
|  |             self.lockfile = None | ||||||
|  |  | ||||||
|     def _encode_filename(self, path): |     def _encode_filename(self, path): | ||||||
|         # Encode all paths to UTF-8, regardless of sys.getfilesystemencoding(), |         # Encode all paths to UTF-8, regardless of sys.getfilesystemencoding(), | ||||||
| @@ -62,7 +79,12 @@ class BulkData(object): | |||||||
|         if Table.exists(ospath): |         if Table.exists(ospath): | ||||||
|             raise ValueError("stream already exists at this path") |             raise ValueError("stream already exists at this path") | ||||||
|         if os.path.isdir(ospath): |         if os.path.isdir(ospath): | ||||||
|             raise ValueError("subdirs of this path already exist") |             # Look for any files in subdirectories.  Fully empty subdirectories | ||||||
|  |             # are OK; they might be there during a rename | ||||||
|  |             for (root, dirs, files) in os.walk(ospath): | ||||||
|  |                 if len(files): | ||||||
|  |                     raise ValueError( | ||||||
|  |                         "non-empty subdirs of this path already exist") | ||||||
|  |  | ||||||
|     def _create_parents(self, unicodepath): |     def _create_parents(self, unicodepath): | ||||||
|         """Verify the path name, and create parent directories if they |         """Verify the path name, and create parent directories if they | ||||||
| @@ -134,7 +156,7 @@ class BulkData(object): | |||||||
|  |  | ||||||
|             # Open and cache it |             # Open and cache it | ||||||
|             self.getnode(unicodepath) |             self.getnode(unicodepath) | ||||||
|         except: |         except Exception: | ||||||
|             exc_info = sys.exc_info() |             exc_info = sys.exc_info() | ||||||
|             try: |             try: | ||||||
|                 os.rmdir(ospath) |                 os.rmdir(ospath) | ||||||
| @@ -171,7 +193,6 @@ class BulkData(object): | |||||||
|         # Basic checks |         # Basic checks | ||||||
|         if oldospath == newospath: |         if oldospath == newospath: | ||||||
|             raise ValueError("old and new paths are the same") |             raise ValueError("old and new paths are the same") | ||||||
|         self._create_check_ospath(newospath) |  | ||||||
|  |  | ||||||
|         # Move the table to a temporary location |         # Move the table to a temporary location | ||||||
|         tmpdir = tempfile.mkdtemp(prefix = "rename-", dir = self.root) |         tmpdir = tempfile.mkdtemp(prefix = "rename-", dir = self.root) | ||||||
| @@ -179,6 +200,9 @@ class BulkData(object): | |||||||
|         os.rename(oldospath, tmppath) |         os.rename(oldospath, tmppath) | ||||||
|  |  | ||||||
|         try: |         try: | ||||||
|  |             # Check destination path | ||||||
|  |             self._create_check_ospath(newospath) | ||||||
|  |  | ||||||
|             # Create parent dirs for new location |             # Create parent dirs for new location | ||||||
|             self._create_parents(newunicodepath) |             self._create_parents(newunicodepath) | ||||||
|  |  | ||||||
| @@ -306,7 +330,8 @@ class Table(object): | |||||||
|  |  | ||||||
|         # Find the last directory.  We sort and loop through all of them, |         # Find the last directory.  We sort and loop through all of them, | ||||||
|         # starting with the numerically greatest, because the dirs could be |         # starting with the numerically greatest, because the dirs could be | ||||||
|         # empty if something was deleted. |         # empty if something was deleted but the directory was unexpectedly | ||||||
|  |         # not deleted. | ||||||
|         subdirs = sorted(filter(regex.search, os.listdir(self.root)), |         subdirs = sorted(filter(regex.search, os.listdir(self.root)), | ||||||
|                          key = lambda x: int(x, 16), reverse = True) |                          key = lambda x: int(x, 16), reverse = True) | ||||||
|  |  | ||||||
| @@ -371,7 +396,7 @@ class Table(object): | |||||||
|             # Try deleting subdir, too |             # Try deleting subdir, too | ||||||
|             try: |             try: | ||||||
|                 os.rmdir(os.path.join(self.root, subdir)) |                 os.rmdir(os.path.join(self.root, subdir)) | ||||||
|             except: |             except Exception: | ||||||
|                 pass |                 pass | ||||||
|  |  | ||||||
|     # Cache open files |     # Cache open files | ||||||
| @@ -389,12 +414,16 @@ class Table(object): | |||||||
|         return rocket.Rocket(self.layout, |         return rocket.Rocket(self.layout, | ||||||
|                              os.path.join(self.root, subdir, filename)) |                              os.path.join(self.root, subdir, filename)) | ||||||
|  |  | ||||||
|     def append_string(self, data, start, end): |     def append_data(self, data, start, end, binary = False): | ||||||
|         """Parse the formatted string in 'data', according to the |         """Parse the formatted string in 'data', according to the | ||||||
|         current layout, and append it to the table.  If any timestamps |         current layout, and append it to the table.  If any timestamps | ||||||
|         are non-monotonic, or don't fall between 'start' and 'end', |         are non-monotonic, or don't fall between 'start' and 'end', | ||||||
|         a ValueError is raised. |         a ValueError is raised. | ||||||
|  |  | ||||||
|  |         If 'binary' is True, the data should be in raw binary format | ||||||
|  |         instead: little-endian, matching the current table's layout, | ||||||
|  |         including the int64 timestamp. | ||||||
|  |  | ||||||
|         If this function succeeds, it returns normally.  Otherwise, |         If this function succeeds, it returns normally.  Otherwise, | ||||||
|         the table is reverted back to its original state by truncating |         the table is reverted back to its original state by truncating | ||||||
|         or deleting files as necessary.""" |         or deleting files as necessary.""" | ||||||
| @@ -413,17 +442,26 @@ class Table(object): | |||||||
|                 # Ask the rocket object to parse and append up to "count" |                 # Ask the rocket object to parse and append up to "count" | ||||||
|                 # rows of data, verifying things along the way. |                 # rows of data, verifying things along the way. | ||||||
|                 try: |                 try: | ||||||
|  |                     if binary: | ||||||
|  |                         appender = f.append_binary | ||||||
|  |                     else: | ||||||
|  |                         appender = f.append_string | ||||||
|                     (added_rows, data_offset, last_timestamp, linenum |                     (added_rows, data_offset, last_timestamp, linenum | ||||||
|                      ) = f.append_string(count, data, data_offset, linenum, |                      ) = appender(count, data, data_offset, linenum, | ||||||
|                                   start, end, last_timestamp) |                                   start, end, last_timestamp) | ||||||
|                 except rocket.ParseError as e: |                 except rocket.ParseError as e: | ||||||
|                     (linenum, colnum, errtype, obj) = e.args |                     (linenum, colnum, errtype, obj) = e.args | ||||||
|  |                     if binary: | ||||||
|  |                         where = "byte %d: " % (linenum) | ||||||
|  |                     else: | ||||||
|                         where = "line %d, column %d: " % (linenum, colnum) |                         where = "line %d, column %d: " % (linenum, colnum) | ||||||
|                     # Extract out the error line, add column marker |                     # Extract out the error line, add column marker | ||||||
|                     try: |                     try: | ||||||
|  |                         if binary: | ||||||
|  |                             raise IndexError | ||||||
|                         bad = data.splitlines()[linenum-1] |                         bad = data.splitlines()[linenum-1] | ||||||
|                         badptr = ' ' * (colnum - 1) + '^' |                         bad += '\n' + ' ' * (colnum - 1) + '^' | ||||||
|                     except IndexError: # pragma: no cover |                     except IndexError: | ||||||
|                         bad = "" |                         bad = "" | ||||||
|                     if errtype == rocket.ERR_NON_MONOTONIC: |                     if errtype == rocket.ERR_NON_MONOTONIC: | ||||||
|                         err = "timestamp is not monotonically increasing" |                         err = "timestamp is not monotonically increasing" | ||||||
| @@ -439,7 +477,7 @@ class Table(object): | |||||||
|                     else: |                     else: | ||||||
|                         err = str(obj) |                         err = str(obj) | ||||||
|                     raise ValueError("error parsing input data: " + |                     raise ValueError("error parsing input data: " + | ||||||
|                                      where + err + "\n" + bad + "\n" + badptr) |                                      where + err + "\n" + bad) | ||||||
|                 tot_rows += added_rows |                 tot_rows += added_rows | ||||||
|         except Exception: |         except Exception: | ||||||
|             # Some failure, so try to roll things back by truncating or |             # Some failure, so try to roll things back by truncating or | ||||||
| @@ -455,7 +493,7 @@ class Table(object): | |||||||
|             # Success, so update self.nrows accordingly |             # Success, so update self.nrows accordingly | ||||||
|             self.nrows = tot_rows |             self.nrows = tot_rows | ||||||
|  |  | ||||||
|     def get_data(self, start, stop): |     def get_data(self, start, stop, binary = False): | ||||||
|         """Extract data corresponding to Python range [n:m], |         """Extract data corresponding to Python range [n:m], | ||||||
|         and returns a formatted string""" |         and returns a formatted string""" | ||||||
|         if (start is None or |         if (start is None or | ||||||
| @@ -473,10 +511,13 @@ class Table(object): | |||||||
|             if count > remaining: |             if count > remaining: | ||||||
|                 count = remaining |                 count = remaining | ||||||
|             f = self.file_open(subdir, filename) |             f = self.file_open(subdir, filename) | ||||||
|  |             if binary: | ||||||
|  |                 ret.append(f.extract_binary(offset, count)) | ||||||
|  |             else: | ||||||
|                 ret.append(f.extract_string(offset, count)) |                 ret.append(f.extract_string(offset, count)) | ||||||
|             remaining -= count |             remaining -= count | ||||||
|             row += count |             row += count | ||||||
|         return "".join(ret) |         return b"".join(ret) | ||||||
|  |  | ||||||
|     def __getitem__(self, row): |     def __getitem__(self, row): | ||||||
|         """Extract timestamps from a row, with table[n] notation.""" |         """Extract timestamps from a row, with table[n] notation.""" | ||||||
| @@ -504,7 +545,7 @@ class Table(object): | |||||||
|             with open(cachefile, "rb") as f: |             with open(cachefile, "rb") as f: | ||||||
|                 ranges = pickle.load(f) |                 ranges = pickle.load(f) | ||||||
|             cachefile_present = True |             cachefile_present = True | ||||||
|         except: |         except Exception: | ||||||
|             ranges = [] |             ranges = [] | ||||||
|             cachefile_present = False |             cachefile_present = False | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,5 +1,9 @@ | |||||||
| """Interval, IntervalSet | """Interval, IntervalSet | ||||||
|  |  | ||||||
|  | The Interval implemented here is just like | ||||||
|  | nilmdb.utils.interval.Interval, except implemented in Cython for | ||||||
|  | speed. | ||||||
|  |  | ||||||
| Represents an interval of time, and a set of such intervals. | Represents an interval of time, and a set of such intervals. | ||||||
|  |  | ||||||
| Intervals are half-open, ie. they include data points with timestamps | Intervals are half-open, ie. they include data points with timestamps | ||||||
| @@ -23,6 +27,7 @@ from ..utils.time import min_timestamp as nilmdb_min_timestamp | |||||||
| from ..utils.time import max_timestamp as nilmdb_max_timestamp | from ..utils.time import max_timestamp as nilmdb_max_timestamp | ||||||
| from ..utils.time import timestamp_to_string | from ..utils.time import timestamp_to_string | ||||||
| from ..utils.iterator import imerge | from ..utils.iterator import imerge | ||||||
|  | from ..utils.interval import IntervalError | ||||||
| import itertools | import itertools | ||||||
|  |  | ||||||
| cimport rbtree | cimport rbtree | ||||||
| @@ -30,10 +35,6 @@ from libc.stdint cimport uint64_t, int64_t | |||||||
|  |  | ||||||
| ctypedef int64_t timestamp_t | ctypedef int64_t timestamp_t | ||||||
|  |  | ||||||
| class IntervalError(Exception): |  | ||||||
|     """Error due to interval overlap, etc""" |  | ||||||
|     pass |  | ||||||
|  |  | ||||||
| cdef class Interval: | cdef class Interval: | ||||||
|     """Represents an interval of time.""" |     """Represents an interval of time.""" | ||||||
|  |  | ||||||
| @@ -59,17 +60,7 @@ cdef class Interval: | |||||||
|  |  | ||||||
|     def __cmp__(self, Interval other): |     def __cmp__(self, Interval other): | ||||||
|         """Compare two intervals.  If non-equal, order by start then end""" |         """Compare two intervals.  If non-equal, order by start then end""" | ||||||
|         if not isinstance(other, Interval): |         return cmp(self.start, other.start) or cmp(self.end, other.end) | ||||||
|             raise TypeError("bad type") |  | ||||||
|         if self.start == other.start: |  | ||||||
|             if self.end < other.end: |  | ||||||
|                 return -1 |  | ||||||
|             if self.end > other.end: |  | ||||||
|                 return 1 |  | ||||||
|             return 0 |  | ||||||
|         if self.start < other.start: |  | ||||||
|             return -1 |  | ||||||
|         return 1 |  | ||||||
|  |  | ||||||
|     cpdef intersects(self, Interval other): |     cpdef intersects(self, Interval other): | ||||||
|         """Return True if two Interval objects intersect""" |         """Return True if two Interval objects intersect""" | ||||||
| @@ -295,81 +286,19 @@ cdef class IntervalSet: | |||||||
|         (potentially) subsetted to make the one that is being |         (potentially) subsetted to make the one that is being | ||||||
|         returned. |         returned. | ||||||
|         """ |         """ | ||||||
|         if not isinstance(interval, Interval): |         if orig: | ||||||
|             raise TypeError("bad type") |  | ||||||
|             for n in self.tree.intersect(interval.start, interval.end): |             for n in self.tree.intersect(interval.start, interval.end): | ||||||
|                 i = n.obj |                 i = n.obj | ||||||
|             if i: |  | ||||||
|                 if i.start >= interval.start and i.end <= interval.end: |  | ||||||
|                     if orig: |  | ||||||
|                         yield (i, i) |  | ||||||
|                     else: |  | ||||||
|                         yield i |  | ||||||
|                 else: |  | ||||||
|                 subset = i.subset(max(i.start, interval.start), |                 subset = i.subset(max(i.start, interval.start), | ||||||
|                                   min(i.end, interval.end)) |                                   min(i.end, interval.end)) | ||||||
|                     if orig: |  | ||||||
|                 yield (subset, i) |                 yield (subset, i) | ||||||
|         else: |         else: | ||||||
|  |             for n in self.tree.intersect(interval.start, interval.end): | ||||||
|  |                 i = n.obj | ||||||
|  |                 subset = i.subset(max(i.start, interval.start), | ||||||
|  |                                   min(i.end, interval.end)) | ||||||
|                 yield subset |                 yield subset | ||||||
|  |  | ||||||
|     def set_difference(self, IntervalSet other not None, |  | ||||||
|                        Interval bounds = None): |  | ||||||
|         """ |  | ||||||
|         Compute the difference (self \\ other) between this |  | ||||||
|         IntervalSet and the given IntervalSet; i.e., the ranges |  | ||||||
|         that are present in 'self' but not 'other'. |  | ||||||
|  |  | ||||||
|         If 'bounds' is not None, results are limited to the range |  | ||||||
|         specified by the interval 'bounds'. |  | ||||||
|  |  | ||||||
|         Returns a generator that yields each interval in turn. |  | ||||||
|         Output intervals are built as subsets of the intervals in the |  | ||||||
|         first argument (self). |  | ||||||
|         """ |  | ||||||
|         # Iterate through all starts and ends in sorted order.  Add a |  | ||||||
|         # tag to the iterator so that we can figure out which one they |  | ||||||
|         # were, after sorting. |  | ||||||
|         def decorate(it, key_start, key_end): |  | ||||||
|             for i in it: |  | ||||||
|                 yield i.start, key_start, i |  | ||||||
|                 yield i.end, key_end, i |  | ||||||
|         if bounds is None: |  | ||||||
|             bounds = Interval(nilmdb_min_timestamp, |  | ||||||
|                               nilmdb_max_timestamp) |  | ||||||
|         self_iter = decorate(self.intersection(bounds), 0, 2) |  | ||||||
|         other_iter = decorate(other.intersection(bounds), 1, 3) |  | ||||||
|  |  | ||||||
|         # Now iterate over the timestamps of each start and end. |  | ||||||
|         # At each point, evaluate which type of end it is, to determine |  | ||||||
|         # how to build up the output intervals. |  | ||||||
|         self_interval = None |  | ||||||
|         other_interval = None |  | ||||||
|         out_start = None |  | ||||||
|         for (ts, k, i) in imerge(self_iter, other_iter): |  | ||||||
|             if k == 0: |  | ||||||
|                 # start self interval |  | ||||||
|                 self_interval = i |  | ||||||
|                 if other_interval is None: |  | ||||||
|                     out_start = ts |  | ||||||
|             elif k == 1: |  | ||||||
|                 # start other interval |  | ||||||
|                 other_interval = i |  | ||||||
|                 if out_start is not None and out_start != ts: |  | ||||||
|                     yield self_interval.subset(out_start, ts) |  | ||||||
|                 out_start = None |  | ||||||
|             elif k == 2: |  | ||||||
|                 # end self interval |  | ||||||
|                 if out_start is not None and out_start != ts: |  | ||||||
|                     yield self_interval.subset(out_start, ts) |  | ||||||
|                 out_start = None |  | ||||||
|                 self_interval = None |  | ||||||
|             elif k == 3: |  | ||||||
|                 # end other interval |  | ||||||
|                 other_interval = None |  | ||||||
|                 if self_interval: |  | ||||||
|                     out_start = ts |  | ||||||
|  |  | ||||||
|     cpdef intersects(self, Interval other): |     cpdef intersects(self, Interval other): | ||||||
|         """Return True if this IntervalSet intersects another interval""" |         """Return True if this IntervalSet intersects another interval""" | ||||||
|         for n in self.tree.intersect(other.start, other.end): |         for n in self.tree.intersect(other.start, other.end): | ||||||
|   | |||||||
| @@ -1,204 +0,0 @@ | |||||||
| # cython: profile=False |  | ||||||
|  |  | ||||||
| import time |  | ||||||
| import sys |  | ||||||
| import inspect |  | ||||||
| import cStringIO |  | ||||||
|  |  | ||||||
| from ..utils.time import min_timestamp as nilmdb_min_timestamp |  | ||||||
|  |  | ||||||
| cdef enum: |  | ||||||
|     max_value_count = 64 |  | ||||||
|  |  | ||||||
| cimport cython |  | ||||||
| cimport libc.stdlib |  | ||||||
| cimport libc.stdio |  | ||||||
| cimport libc.string |  | ||||||
|  |  | ||||||
| class ParserError(Exception): |  | ||||||
|     def __init__(self, line, message): |  | ||||||
|         self.message = "line " + str(line) + ": " + message |  | ||||||
|         Exception.__init__(self, self.message) |  | ||||||
|  |  | ||||||
| class FormatterError(Exception): |  | ||||||
|     pass |  | ||||||
|  |  | ||||||
| class Layout: |  | ||||||
|     """Represents a NILM database layout""" |  | ||||||
|  |  | ||||||
|     def __init__(self, typestring): |  | ||||||
|         """Initialize this Layout object to handle the specified |  | ||||||
|         type string""" |  | ||||||
|         try: |  | ||||||
|             [ datatype, count ] = typestring.split("_") |  | ||||||
|         except: |  | ||||||
|             raise KeyError("invalid layout string") |  | ||||||
|  |  | ||||||
|         try: |  | ||||||
|             self.count = int(count) |  | ||||||
|         except ValueError: |  | ||||||
|             raise KeyError("invalid count") |  | ||||||
|         if self.count < 1 or self.count > max_value_count: |  | ||||||
|             raise KeyError("invalid count") |  | ||||||
|  |  | ||||||
|         if datatype == 'uint16': |  | ||||||
|             self.parse = self.parse_uint16 |  | ||||||
|             self.format_str = "%.6f" + " %d" * self.count |  | ||||||
|             self.format = self.format_generic |  | ||||||
|         elif datatype == 'float32': |  | ||||||
|             self.parse = self.parse_float64 |  | ||||||
|             self.format_str = "%.6f" + " %.6e" * self.count |  | ||||||
|             self.format = self.format_generic |  | ||||||
|         elif datatype == 'float64': |  | ||||||
|             self.parse = self.parse_float64 |  | ||||||
|             self.format_str = "%.6f" + " %.16e" * self.count |  | ||||||
|             self.format = self.format_generic |  | ||||||
|         else: |  | ||||||
|             raise KeyError("invalid type") |  | ||||||
|  |  | ||||||
|         self.datatype = datatype |  | ||||||
|  |  | ||||||
|     # Parsers |  | ||||||
|     def parse_float64(self, char *text): |  | ||||||
|         cdef int n |  | ||||||
|         cdef double ts |  | ||||||
|         # Return doubles even in float32 case, since they're going into |  | ||||||
|         # a Python array which would upconvert to double anyway. |  | ||||||
|         result = [0] * (self.count + 1) |  | ||||||
|         cdef char *end |  | ||||||
|         ts = libc.stdlib.strtod(text, &end) |  | ||||||
|         if end == text: |  | ||||||
|             raise ValueError("bad timestamp") |  | ||||||
|         result[0] = ts |  | ||||||
|         for n in range(self.count): |  | ||||||
|             text = end |  | ||||||
|             result[n+1] = libc.stdlib.strtod(text, &end) |  | ||||||
|             if end == text: |  | ||||||
|                 raise ValueError("wrong number of values") |  | ||||||
|         n = 0 |  | ||||||
|         while end[n] == ' ': |  | ||||||
|             n += 1 |  | ||||||
|         if end[n] != '\n' and end[n] != '#' and end[n] != '\0': |  | ||||||
|             raise ValueError("extra data on line") |  | ||||||
|         return (ts, result) |  | ||||||
|  |  | ||||||
|     def parse_uint16(self, char *text): |  | ||||||
|         cdef int n |  | ||||||
|         cdef double ts |  | ||||||
|         cdef int v |  | ||||||
|         cdef char *end |  | ||||||
|         result = [0] * (self.count + 1) |  | ||||||
|         ts = libc.stdlib.strtod(text, &end) |  | ||||||
|         if end == text: |  | ||||||
|             raise ValueError("bad timestamp") |  | ||||||
|         result[0] = ts |  | ||||||
|         for n in range(self.count): |  | ||||||
|             text = end |  | ||||||
|             v = libc.stdlib.strtol(text, &end, 10) |  | ||||||
|             if v < 0 or v > 65535: |  | ||||||
|                 raise ValueError("value out of range") |  | ||||||
|             result[n+1] = v |  | ||||||
|             if end == text: |  | ||||||
|                 raise ValueError("wrong number of values") |  | ||||||
|         n = 0 |  | ||||||
|         while end[n] == ' ': |  | ||||||
|             n += 1 |  | ||||||
|         if end[n] != '\n' and end[n] != '#' and end[n] != '\0': |  | ||||||
|             raise ValueError("extra data on line") |  | ||||||
|         return (ts, result) |  | ||||||
|  |  | ||||||
|     # Formatters |  | ||||||
|     def format_generic(self, d): |  | ||||||
|         n = len(d) - 1 |  | ||||||
|         if n != self.count: |  | ||||||
|             raise ValueError("wrong number of values for layout type: " |  | ||||||
|                              "got %d, wanted %d" % (n, self.count)) |  | ||||||
|         return (self.format_str % tuple(d)) + "\n" |  | ||||||
|  |  | ||||||
| # Get a layout by name |  | ||||||
| def get_named(typestring): |  | ||||||
|     try: |  | ||||||
|         return Layout(typestring) |  | ||||||
|     except KeyError: |  | ||||||
|         compat = { "PrepData": "float32_8", |  | ||||||
|                    "RawData": "uint16_6", |  | ||||||
|                    "RawNotchedData": "uint16_9" } |  | ||||||
|         return Layout(compat[typestring]) |  | ||||||
|  |  | ||||||
| class Parser(object): |  | ||||||
|     """Object that parses and stores ASCII data for inclusion into the |  | ||||||
|     database""" |  | ||||||
|  |  | ||||||
|     def __init__(self, layout): |  | ||||||
|         if issubclass(layout.__class__, Layout): |  | ||||||
|             self.layout = layout |  | ||||||
|         else: |  | ||||||
|             try: |  | ||||||
|                 self.layout = get_named(layout) |  | ||||||
|             except KeyError: |  | ||||||
|                 raise TypeError("unknown layout") |  | ||||||
|  |  | ||||||
|         self.data = [] |  | ||||||
|         self.min_timestamp = None |  | ||||||
|         self.max_timestamp = None |  | ||||||
|  |  | ||||||
|     def parse(self, textdata): |  | ||||||
|         """ |  | ||||||
|         Parse the data, provided as lines of text, using the current |  | ||||||
|         layout, into an internal data structure suitable for a |  | ||||||
|         pytables 'table.append(parser.data)'. |  | ||||||
|         """ |  | ||||||
|         cdef double last_ts = nilmdb_min_timestamp |  | ||||||
|         cdef double ts |  | ||||||
|         cdef int n = 0, i |  | ||||||
|         cdef char *line |  | ||||||
|  |  | ||||||
|         indata = cStringIO.StringIO(textdata) |  | ||||||
|         # Assume any parsing error is a real error. |  | ||||||
|         # In the future we might want to skip completely empty lines, |  | ||||||
|         # or partial lines right before EOF? |  | ||||||
|         try: |  | ||||||
|             self.data = [] |  | ||||||
|             for pyline in indata: |  | ||||||
|                 line = pyline |  | ||||||
|                 n += 1 |  | ||||||
|                 if line[0] == '\#': |  | ||||||
|                     continue |  | ||||||
|                 (ts, row) = self.layout.parse(line) |  | ||||||
|                 if ts <= last_ts: |  | ||||||
|                     raise ValueError("timestamp is not " |  | ||||||
|                                      "monotonically increasing") |  | ||||||
|                 last_ts = ts |  | ||||||
|                 self.data.append(row) |  | ||||||
|         except (ValueError, IndexError, TypeError) as e: |  | ||||||
|             raise ParserError(n, "error: " + e.message) |  | ||||||
|  |  | ||||||
|         # Mark timestamp ranges |  | ||||||
|         if len(self.data): |  | ||||||
|             self.min_timestamp = self.data[0][0] |  | ||||||
|             self.max_timestamp = self.data[-1][0] |  | ||||||
|  |  | ||||||
| class Formatter(object): |  | ||||||
|     """Object that formats database data into ASCII""" |  | ||||||
|  |  | ||||||
|     def __init__(self, layout): |  | ||||||
|         if issubclass(layout.__class__, Layout): |  | ||||||
|             self.layout = layout |  | ||||||
|         else: |  | ||||||
|             try: |  | ||||||
|                 self.layout = get_named(layout) |  | ||||||
|             except KeyError: |  | ||||||
|                 raise TypeError("unknown layout") |  | ||||||
|  |  | ||||||
|     def format(self, data): |  | ||||||
|         """ |  | ||||||
|         Format raw data from the database, using the current layout, |  | ||||||
|         as lines of ACSII text. |  | ||||||
|         """ |  | ||||||
|         text = cStringIO.StringIO() |  | ||||||
|         try: |  | ||||||
|             for row in data: |  | ||||||
|                 text.write(self.layout.format(row)) |  | ||||||
|         except (ValueError, IndexError, TypeError) as e: |  | ||||||
|             raise FormatterError("formatting error: " + e.message) |  | ||||||
|         return text.getvalue() |  | ||||||
| @@ -12,8 +12,11 @@ Manages both the SQL database and the table storage backend. | |||||||
| from __future__ import absolute_import | from __future__ import absolute_import | ||||||
| import nilmdb.utils | import nilmdb.utils | ||||||
| from nilmdb.utils.printf import * | from nilmdb.utils.printf import * | ||||||
| from nilmdb.server.interval import (Interval, DBInterval, | from nilmdb.utils.time import timestamp_to_string | ||||||
|                                     IntervalSet, IntervalError) |  | ||||||
|  | from nilmdb.utils.interval import IntervalError | ||||||
|  | from nilmdb.server.interval import Interval, DBInterval, IntervalSet | ||||||
|  |  | ||||||
| from nilmdb.server import bulkdata | from nilmdb.server import bulkdata | ||||||
| from nilmdb.server.errors import NilmDBError, StreamError, OverlapError | from nilmdb.server.errors import NilmDBError, StreamError, OverlapError | ||||||
|  |  | ||||||
| @@ -81,7 +84,18 @@ class NilmDB(object): | |||||||
|     verbose = 0 |     verbose = 0 | ||||||
|  |  | ||||||
|     def __init__(self, basepath, max_results=None, |     def __init__(self, basepath, max_results=None, | ||||||
|                  bulkdata_args=None): |                  max_removals=None, bulkdata_args=None): | ||||||
|  |         """Initialize NilmDB at the given basepath. | ||||||
|  |         Other arguments are for debugging / testing: | ||||||
|  |  | ||||||
|  |         'max_results' is the max rows to send in a single | ||||||
|  |         stream_intervals or stream_extract response. | ||||||
|  |  | ||||||
|  |         'max_removals' is the max rows to delete at once | ||||||
|  |         in stream_move. | ||||||
|  |  | ||||||
|  |         'bulkdata_args' is kwargs for the bulkdata module. | ||||||
|  |         """ | ||||||
|         if bulkdata_args is None: |         if bulkdata_args is None: | ||||||
|             bulkdata_args = {} |             bulkdata_args = {} | ||||||
|  |  | ||||||
| @@ -92,7 +106,9 @@ class NilmDB(object): | |||||||
|         try: |         try: | ||||||
|             os.makedirs(self.basepath) |             os.makedirs(self.basepath) | ||||||
|         except OSError as e: |         except OSError as e: | ||||||
|             if e.errno != errno.EEXIST: |             if e.errno != errno.EEXIST: # pragma: no cover | ||||||
|  |                 # (no coverage, because it's hard to trigger this case | ||||||
|  |                 # if tests are run as root) | ||||||
|                 raise IOError("can't create tree " + self.basepath) |                 raise IOError("can't create tree " + self.basepath) | ||||||
|  |  | ||||||
|         # Our data goes inside it |         # Our data goes inside it | ||||||
| @@ -103,19 +119,20 @@ class NilmDB(object): | |||||||
|         self.con = sqlite3.connect(sqlfilename, check_same_thread = True) |         self.con = sqlite3.connect(sqlfilename, check_same_thread = True) | ||||||
|         try: |         try: | ||||||
|             self._sql_schema_update() |             self._sql_schema_update() | ||||||
|         finally: # pragma: no cover |         except Exception: # pragma: no cover | ||||||
|             self.data.close() |             self.data.close() | ||||||
|  |             raise | ||||||
|  |  | ||||||
|         # See big comment at top about the performance implications of this |         # See big comment at top about the performance implications of this | ||||||
|         self.con.execute("PRAGMA synchronous=NORMAL") |         self.con.execute("PRAGMA synchronous=NORMAL") | ||||||
|         self.con.execute("PRAGMA journal_mode=WAL") |         self.con.execute("PRAGMA journal_mode=WAL") | ||||||
|  |  | ||||||
|         # Approximate largest number of elements that we want to send |         # Approximate largest number of elements that we want to send | ||||||
|         # in a single reply (for stream_intervals, stream_extract) |         # in a single reply (for stream_intervals, stream_extract). | ||||||
|         if max_results: |         self.max_results = max_results or 16384 | ||||||
|             self.max_results = max_results |  | ||||||
|         else: |         # Remove up to this many rows per call to stream_remove. | ||||||
|             self.max_results = 16384 |         self.max_removals = max_removals or 1048576 | ||||||
|  |  | ||||||
|     def get_basepath(self): |     def get_basepath(self): | ||||||
|         return self.basepath |         return self.basepath | ||||||
| @@ -159,7 +176,7 @@ class NilmDB(object): | |||||||
|             raise NilmDBError("start must precede end") |             raise NilmDBError("start must precede end") | ||||||
|         return (start, end) |         return (start, end) | ||||||
|  |  | ||||||
|     @nilmdb.utils.lru_cache(size = 16) |     @nilmdb.utils.lru_cache(size = 64) | ||||||
|     def _get_intervals(self, stream_id): |     def _get_intervals(self, stream_id): | ||||||
|         """ |         """ | ||||||
|         Return a mutable IntervalSet corresponding to the given stream ID. |         Return a mutable IntervalSet corresponding to the given stream ID. | ||||||
| @@ -328,18 +345,18 @@ class NilmDB(object): | |||||||
|         List all intervals in 'path' between 'start' and 'end'.  If |         List all intervals in 'path' between 'start' and 'end'.  If | ||||||
|         'diffpath' is not none, list instead the set-difference |         'diffpath' is not none, list instead the set-difference | ||||||
|         between the intervals in the two streams; i.e. all interval |         between the intervals in the two streams; i.e. all interval | ||||||
|         ranges that are present in 'path' but not 'path2'. |         ranges that are present in 'path' but not 'diffpath'. | ||||||
|  |  | ||||||
|         Returns (intervals, restart) tuple. |         Returns (intervals, restart) tuple. | ||||||
|  |  | ||||||
|         intervals is a list of [start,end] timestamps of all intervals |         'intervals' is a list of [start,end] timestamps of all intervals | ||||||
|         that exist for path, between start and end. |         that exist for path, between start and end. | ||||||
|  |  | ||||||
|         restart, if nonzero, means that there were too many results to |         'restart', if not None, means that there were too many results | ||||||
|         return in a single request.  The data is complete from the |         to return in a single request.  The data is complete from the | ||||||
|         starting timestamp to the point at which it was truncated, |         starting timestamp to the point at which it was truncated, and | ||||||
|         and a new request with a start time of 'restart' will fetch |         a new request with a start time of 'restart' will fetch the | ||||||
|         the next block of data. |         next block of data. | ||||||
|         """ |         """ | ||||||
|         stream_id = self._stream_id(path) |         stream_id = self._stream_id(path) | ||||||
|         intervals = self._get_intervals(stream_id) |         intervals = self._get_intervals(stream_id) | ||||||
| @@ -350,7 +367,9 @@ class NilmDB(object): | |||||||
|         requested = Interval(start, end) |         requested = Interval(start, end) | ||||||
|         result = [] |         result = [] | ||||||
|         if diffpath: |         if diffpath: | ||||||
|             getter = intervals.set_difference(diffintervals, requested) |             getter = nilmdb.utils.interval.set_difference( | ||||||
|  |                 intervals.intersection(requested), | ||||||
|  |                 diffintervals.intersection(requested)) | ||||||
|         else: |         else: | ||||||
|             getter = intervals.intersection(requested) |             getter = intervals.intersection(requested) | ||||||
|         for n, i in enumerate(getter): |         for n, i in enumerate(getter): | ||||||
| @@ -359,7 +378,7 @@ class NilmDB(object): | |||||||
|                 break |                 break | ||||||
|             result.append([i.start, i.end]) |             result.append([i.start, i.end]) | ||||||
|         else: |         else: | ||||||
|             restart = 0 |             restart = None | ||||||
|         return (result, restart) |         return (result, restart) | ||||||
|  |  | ||||||
|     def stream_create(self, path, layout_name): |     def stream_create(self, path, layout_name): | ||||||
| @@ -435,28 +454,37 @@ class NilmDB(object): | |||||||
|                         (newpath, stream_id)) |                         (newpath, stream_id)) | ||||||
|  |  | ||||||
|     def stream_destroy(self, path): |     def stream_destroy(self, path): | ||||||
|         """Fully remove a table and all of its data from the database. |         """Fully remove a table from the database.  Fails if there are | ||||||
|         No way to undo it!  Metadata is removed.""" |         any intervals data present; remove them first.  Metadata is | ||||||
|  |         also removed.""" | ||||||
|         stream_id = self._stream_id(path) |         stream_id = self._stream_id(path) | ||||||
|  |  | ||||||
|         # Delete the cached interval data (if it was cached) |         # Verify that no intervals are present, and clear the cache | ||||||
|  |         iset = self._get_intervals(stream_id) | ||||||
|  |         if len(iset): | ||||||
|  |             raise NilmDBError("all intervals must be removed before " | ||||||
|  |                               "destroying a stream") | ||||||
|         self._get_intervals.cache_remove(self, stream_id) |         self._get_intervals.cache_remove(self, stream_id) | ||||||
|  |  | ||||||
|         # Delete the data |         # Delete the bulkdata storage | ||||||
|         self.data.destroy(path) |         self.data.destroy(path) | ||||||
|  |  | ||||||
|         # Delete metadata, stream, intervals |         # Delete metadata, stream, intervals (should be none) | ||||||
|         with self.con as con: |         with self.con as con: | ||||||
|             con.execute("DELETE FROM metadata WHERE stream_id=?", (stream_id,)) |             con.execute("DELETE FROM metadata WHERE stream_id=?", (stream_id,)) | ||||||
|             con.execute("DELETE FROM ranges WHERE stream_id=?", (stream_id,)) |             con.execute("DELETE FROM ranges WHERE stream_id=?", (stream_id,)) | ||||||
|             con.execute("DELETE FROM streams WHERE id=?", (stream_id,)) |             con.execute("DELETE FROM streams WHERE id=?", (stream_id,)) | ||||||
|  |  | ||||||
|     def stream_insert(self, path, start, end, data): |     def stream_insert(self, path, start, end, data, binary = False): | ||||||
|         """Insert new data into the database. |         """Insert new data into the database. | ||||||
|            path: Path at which to add the data |            path: Path at which to add the data | ||||||
|            start: Starting timestamp |            start: Starting timestamp | ||||||
|            end: Ending timestamp |            end: Ending timestamp | ||||||
|            data: Textual data, formatted according to the layout of path |            data: Textual data, formatted according to the layout of path | ||||||
|  |  | ||||||
|  |            'binary', if True, means that 'data' is raw binary: | ||||||
|  |            little-endian, matching the current table's layout, | ||||||
|  |            including the int64 timestamp. | ||||||
|            """ |            """ | ||||||
|         # First check for basic overlap using timestamp info given. |         # First check for basic overlap using timestamp info given. | ||||||
|         stream_id = self._stream_id(path) |         stream_id = self._stream_id(path) | ||||||
| @@ -470,7 +498,7 @@ class NilmDB(object): | |||||||
|         # there are any parse errors. |         # there are any parse errors. | ||||||
|         table = self.data.getnode(path) |         table = self.data.getnode(path) | ||||||
|         row_start = table.nrows |         row_start = table.nrows | ||||||
|         table.append_string(data, start, end) |         table.append_data(data, start, end, binary) | ||||||
|         row_end = table.nrows |         row_end = table.nrows | ||||||
|  |  | ||||||
|         # Insert the record into the sql database. |         # Insert the record into the sql database. | ||||||
| @@ -513,23 +541,31 @@ class NilmDB(object): | |||||||
|                                   dbinterval.db_startpos, |                                   dbinterval.db_startpos, | ||||||
|                                   dbinterval.db_endpos) |                                   dbinterval.db_endpos) | ||||||
|  |  | ||||||
|     def stream_extract(self, path, start = None, end = None, count = False): |     def stream_extract(self, path, start = None, end = None, | ||||||
|  |                        count = False, markup = False, binary = False): | ||||||
|         """ |         """ | ||||||
|         Returns (data, restart) tuple. |         Returns (data, restart) tuple. | ||||||
|  |  | ||||||
|         data is ASCII-formatted data from the database, formatted |         'data' is ASCII-formatted data from the database, formatted | ||||||
|         according to the layout of the stream. |         according to the layout of the stream. | ||||||
|  |  | ||||||
|         restart, if nonzero, means that there were too many results to |         'restart', if not None, means that there were too many results to | ||||||
|         return in a single request.  The data is complete from the |         return in a single request.  The data is complete from the | ||||||
|         starting timestamp to the point at which it was truncated, |         starting timestamp to the point at which it was truncated, | ||||||
|         and a new request with a start time of 'restart' will fetch |         and a new request with a start time of 'restart' will fetch | ||||||
|         the next block of data. |         the next block of data. | ||||||
|  |  | ||||||
|         count, if true, means to not return raw data, but just the count |         'count', if true, means to not return raw data, but just the count | ||||||
|         of rows that would have been returned.  This is much faster |         of rows that would have been returned.  This is much faster | ||||||
|         than actually fetching the data.  It is not limited by |         than actually fetching the data.  It is not limited by | ||||||
|         max_results. |         max_results. | ||||||
|  |  | ||||||
|  |         'markup', if true, indicates that returned data should be | ||||||
|  |         marked with a comment denoting when a particular interval | ||||||
|  |         starts, and another comment when an interval ends. | ||||||
|  |  | ||||||
|  |         'binary', if true, means to return raw binary rather than | ||||||
|  |         ASCII-formatted data. | ||||||
|         """ |         """ | ||||||
|         stream_id = self._stream_id(path) |         stream_id = self._stream_id(path) | ||||||
|         table = self.data.getnode(path) |         table = self.data.getnode(path) | ||||||
| @@ -539,7 +575,9 @@ class NilmDB(object): | |||||||
|         result = [] |         result = [] | ||||||
|         matched = 0 |         matched = 0 | ||||||
|         remaining = self.max_results |         remaining = self.max_results | ||||||
|         restart = 0 |         restart = None | ||||||
|  |         if binary and (markup or count): | ||||||
|  |             raise NilmDBError("binary mode can't be used with markup or count") | ||||||
|         for interval in intervals.intersection(requested): |         for interval in intervals.intersection(requested): | ||||||
|             # Reading single rows from the table is too slow, so |             # Reading single rows from the table is too slow, so | ||||||
|             # we use two bisections to find both the starting and |             # we use two bisections to find both the starting and | ||||||
| @@ -558,14 +596,26 @@ class NilmDB(object): | |||||||
|                 row_end = row_max |                 row_end = row_max | ||||||
|                 restart = table[row_max] |                 restart = table[row_max] | ||||||
|  |  | ||||||
|  |             # Add markup | ||||||
|  |             if markup: | ||||||
|  |                 result.append("# interval-start " + | ||||||
|  |                               timestamp_to_string(interval.start) + "\n") | ||||||
|  |  | ||||||
|             # Gather these results up |             # Gather these results up | ||||||
|             result.append(table.get_data(row_start, row_end)) |             result.append(table.get_data(row_start, row_end, binary)) | ||||||
|  |  | ||||||
|             # Count them |             # Count them | ||||||
|             remaining -= row_end - row_start |             remaining -= row_end - row_start | ||||||
|  |  | ||||||
|             if restart: |             # Add markup, and exit if restart is set. | ||||||
|  |             if restart is not None: | ||||||
|  |                 if markup: | ||||||
|  |                     result.append("# interval-end " + | ||||||
|  |                                   timestamp_to_string(restart) + "\n") | ||||||
|                 break |                 break | ||||||
|  |             if markup: | ||||||
|  |                 result.append("# interval-end " + | ||||||
|  |                               timestamp_to_string(interval.end) + "\n") | ||||||
|  |  | ||||||
|         if count: |         if count: | ||||||
|             return matched |             return matched | ||||||
| @@ -574,9 +624,17 @@ class NilmDB(object): | |||||||
|     def stream_remove(self, path, start = None, end = None): |     def stream_remove(self, path, start = None, end = None): | ||||||
|         """ |         """ | ||||||
|         Remove data from the specified time interval within a stream. |         Remove data from the specified time interval within a stream. | ||||||
|         Removes all data in the interval [start, end), and intervals |  | ||||||
|         are truncated or split appropriately.  Returns the number of |         Removes data in the interval [start, end), and intervals are | ||||||
|         data points removed. |         truncated or split appropriately. | ||||||
|  |  | ||||||
|  |         Returns a (removed, restart) tuple. | ||||||
|  |  | ||||||
|  |         'removed' is the number of data points that were removed. | ||||||
|  |  | ||||||
|  |         'restart', if not None, means there were too many rows to | ||||||
|  |         remove in a single request.  This function should be called | ||||||
|  |         again with a start time of 'restart' to complete the removal. | ||||||
|         """ |         """ | ||||||
|         stream_id = self._stream_id(path) |         stream_id = self._stream_id(path) | ||||||
|         table = self.data.getnode(path) |         table = self.data.getnode(path) | ||||||
| @@ -584,6 +642,8 @@ class NilmDB(object): | |||||||
|         (start, end) = self._check_user_times(start, end) |         (start, end) = self._check_user_times(start, end) | ||||||
|         to_remove = Interval(start, end) |         to_remove = Interval(start, end) | ||||||
|         removed = 0 |         removed = 0 | ||||||
|  |         remaining = self.max_removals | ||||||
|  |         restart = None | ||||||
|  |  | ||||||
|         # Can't remove intervals from within the iterator, so we need to |         # Can't remove intervals from within the iterator, so we need to | ||||||
|         # remember what's currently in the intersection now. |         # remember what's currently in the intersection now. | ||||||
| @@ -594,6 +654,13 @@ class NilmDB(object): | |||||||
|             row_start = self._find_start(table, dbint) |             row_start = self._find_start(table, dbint) | ||||||
|             row_end = self._find_end(table, dbint) |             row_end = self._find_end(table, dbint) | ||||||
|  |  | ||||||
|  |             # Shorten it if we'll hit the maximum number of removals | ||||||
|  |             row_max = row_start + remaining | ||||||
|  |             if row_max < row_end: | ||||||
|  |                 row_end = row_max | ||||||
|  |                 dbint.end = table[row_max] | ||||||
|  |                 restart = dbint.end | ||||||
|  |  | ||||||
|             # Adjust the DBInterval to match the newly found ends |             # Adjust the DBInterval to match the newly found ends | ||||||
|             dbint.db_start = dbint.start |             dbint.db_start = dbint.start | ||||||
|             dbint.db_end = dbint.end |             dbint.db_end = dbint.end | ||||||
| @@ -608,5 +675,9 @@ class NilmDB(object): | |||||||
|  |  | ||||||
|             # Count how many were removed |             # Count how many were removed | ||||||
|             removed += row_end - row_start |             removed += row_end - row_start | ||||||
|  |             remaining -= row_end - row_start | ||||||
|  |  | ||||||
|         return removed |             if restart is not None: | ||||||
|  |                 break | ||||||
|  |  | ||||||
|  |         return (removed, restart) | ||||||
|   | |||||||
| @@ -5,6 +5,9 @@ | |||||||
| #include <ctype.h> | #include <ctype.h> | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
|  |  | ||||||
|  | #define __STDC_FORMAT_MACROS | ||||||
|  | #include <inttypes.h> | ||||||
|  |  | ||||||
| /* Values missing from stdint.h */ | /* Values missing from stdint.h */ | ||||||
| #define UINT8_MIN 0 | #define UINT8_MIN 0 | ||||||
| #define UINT16_MIN 0 | #define UINT16_MIN 0 | ||||||
| @@ -19,16 +22,9 @@ | |||||||
|  |  | ||||||
| typedef int64_t timestamp_t; | typedef int64_t timestamp_t; | ||||||
|  |  | ||||||
| /* This code probably needs to be double-checked for the case where |  | ||||||
|    sizeof(long) != 8, so enforce that here with something that will |  | ||||||
|    fail at build time.  We assume that the python integer type can |  | ||||||
|    hold an int64_t. */ |  | ||||||
| const static char __long_ok[1 - 2*!(sizeof(int64_t) == |  | ||||||
| 				    sizeof(long int))] = { 0 }; |  | ||||||
|  |  | ||||||
| /* Somewhat arbitrary, just so we can use fixed sizes for strings | /* Somewhat arbitrary, just so we can use fixed sizes for strings | ||||||
|    etc. */ |    etc. */ | ||||||
| static const int MAX_LAYOUT_COUNT = 128; | static const int MAX_LAYOUT_COUNT = 1024; | ||||||
|  |  | ||||||
| /* Error object and constants */ | /* Error object and constants */ | ||||||
| static PyObject *ParseError; | static PyObject *ParseError; | ||||||
| @@ -58,7 +54,7 @@ static PyObject *raise_str(int line, int col, int code, const char *string) | |||||||
| static PyObject *raise_int(int line, int col, int code, int64_t num) | static PyObject *raise_int(int line, int col, int code, int64_t num) | ||||||
| { | { | ||||||
| 	PyObject *o; | 	PyObject *o; | ||||||
| 	o = Py_BuildValue("(iiil)", line, col, code, num); | 	o = Py_BuildValue("(iiiL)", line, col, code, (long long)num); | ||||||
| 	if (o != NULL) { | 	if (o != NULL) { | ||||||
| 		PyErr_SetObject(ParseError, o); | 		PyErr_SetObject(ParseError, o); | ||||||
| 		Py_DECREF(o); | 		Py_DECREF(o); | ||||||
| @@ -249,11 +245,11 @@ static PyObject *Rocket_get_file_size(Rocket *self) | |||||||
| /**** | /**** | ||||||
|  * Append from string |  * Append from string | ||||||
|  */ |  */ | ||||||
| static inline long int strtol10(const char *nptr, char **endptr) { | static inline long int strtoll10(const char *nptr, char **endptr) { | ||||||
| 	return strtol(nptr, endptr, 10); | 	return strtoll(nptr, endptr, 10); | ||||||
| } | } | ||||||
| static inline long int strtoul10(const char *nptr, char **endptr) { | static inline long int strtoull10(const char *nptr, char **endptr) { | ||||||
| 	return strtoul(nptr, endptr, 10); | 	return strtoull(nptr, endptr, 10); | ||||||
| } | } | ||||||
|  |  | ||||||
| /* .append_string(count, data, offset, linenum, start, end, last_timestamp) */ | /* .append_string(count, data, offset, linenum, start, end, last_timestamp) */ | ||||||
| @@ -264,6 +260,7 @@ static PyObject *Rocket_append_string(Rocket *self, PyObject *args) | |||||||
| 	int offset; | 	int offset; | ||||||
| 	const char *linestart; | 	const char *linestart; | ||||||
| 	int linenum; | 	int linenum; | ||||||
|  |         long long ll1, ll2, ll3; | ||||||
| 	timestamp_t start; | 	timestamp_t start; | ||||||
| 	timestamp_t end; | 	timestamp_t end; | ||||||
| 	timestamp_t last_timestamp; | 	timestamp_t last_timestamp; | ||||||
| @@ -280,10 +277,13 @@ static PyObject *Rocket_append_string(Rocket *self, PyObject *args) | |||||||
| 	   but we need the null termination for strto*.  If we had | 	   but we need the null termination for strto*.  If we had | ||||||
| 	   strnto* that took a length, we could use t# and not require | 	   strnto* that took a length, we could use t# and not require | ||||||
| 	   a copy. */ | 	   a copy. */ | ||||||
| 	if (!PyArg_ParseTuple(args, "isiilll:append_string", &count, | 	if (!PyArg_ParseTuple(args, "isiiLLL:append_string", &count, | ||||||
| 			      &data, &offset, &linenum, | 			      &data, &offset, &linenum, | ||||||
| 			      &start, &end, &last_timestamp)) | 			      &ll1, &ll2, &ll3)) | ||||||
| 		return NULL; | 		return NULL; | ||||||
|  |         start = ll1; | ||||||
|  |         end = ll2; | ||||||
|  |         last_timestamp = ll3; | ||||||
|  |  | ||||||
| 	/* Skip spaces, but don't skip over a newline. */ | 	/* Skip spaces, but don't skip over a newline. */ | ||||||
| #define SKIP_BLANK(buf) do {			\ | #define SKIP_BLANK(buf) do {			\ | ||||||
| @@ -372,14 +372,14 @@ static PyObject *Rocket_append_string(Rocket *self, PyObject *args) | |||||||
| 				goto extra_data_on_line;		\ | 				goto extra_data_on_line;		\ | ||||||
| 			break | 			break | ||||||
|  |  | ||||||
| 			CS(INT8,   strtol10,  t64.i, t8.i,  t8.u,         , 1); | 			CS(INT8,   strtoll10,  t64.i, t8.i,  t8.u,         , 1); | ||||||
| 			CS(UINT8,  strtoul10, t64.u, t8.u,  t8.u,         , 1); | 			CS(UINT8,  strtoull10, t64.u, t8.u,  t8.u,         , 1); | ||||||
| 			CS(INT16,  strtol10,  t64.i, t16.i, t16.u, le16toh, 2); | 			CS(INT16,  strtoll10,  t64.i, t16.i, t16.u, le16toh, 2); | ||||||
| 			CS(UINT16, strtoul10, t64.u, t16.u, t16.u, le16toh, 2); | 			CS(UINT16, strtoull10, t64.u, t16.u, t16.u, le16toh, 2); | ||||||
| 			CS(INT32,  strtol10,  t64.i, t32.i, t32.u, le32toh, 4); | 			CS(INT32,  strtoll10,  t64.i, t32.i, t32.u, le32toh, 4); | ||||||
| 			CS(UINT32, strtoul10, t64.u, t32.u, t32.u, le32toh, 4); | 			CS(UINT32, strtoull10, t64.u, t32.u, t32.u, le32toh, 4); | ||||||
| 			CS(INT64,  strtol10,  t64.i, t64.i, t64.u, le64toh, 8); | 			CS(INT64,  strtoll10,  t64.i, t64.i, t64.u, le64toh, 8); | ||||||
| 			CS(UINT64, strtoul10, t64.u, t64.u, t64.u, le64toh, 8); | 			CS(UINT64, strtoull10, t64.u, t64.u, t64.u, le64toh, 8); | ||||||
| 			CS(FLOAT32, strtod,   t64.d, t32.f, t32.u, le32toh, 4); | 			CS(FLOAT32, strtod,   t64.d, t32.f, t32.u, le32toh, 4); | ||||||
| 			CS(FLOAT64, strtod,   t64.d, t64.d, t64.u, le64toh, 8); | 			CS(FLOAT64, strtod,   t64.d, t64.d, t64.u, le64toh, 8); | ||||||
| #undef CS | #undef CS | ||||||
| @@ -397,7 +397,8 @@ static PyObject *Rocket_append_string(Rocket *self, PyObject *args) | |||||||
| 	/* Build return value and return */ | 	/* Build return value and return */ | ||||||
| 	offset = buf - data; | 	offset = buf - data; | ||||||
| 	PyObject *o; | 	PyObject *o; | ||||||
| 	o = Py_BuildValue("(iili)", written, offset, last_timestamp, linenum); | 	o = Py_BuildValue("(iiLi)", written, offset, | ||||||
|  |                           (long long)last_timestamp, linenum); | ||||||
| 	return o; | 	return o; | ||||||
| err: | err: | ||||||
| 	PyErr_SetFromErrno(PyExc_OSError); | 	PyErr_SetFromErrno(PyExc_OSError); | ||||||
| @@ -419,6 +420,72 @@ extra_data_on_line: | |||||||
| 			 ERR_OTHER, "extra data on line"); | 			 ERR_OTHER, "extra data on line"); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | /**** | ||||||
|  |  * Append from binary data | ||||||
|  |  */ | ||||||
|  |  | ||||||
|  | /* .append_binary(count, data, offset, linenum, start, end, last_timestamp) */ | ||||||
|  | static PyObject *Rocket_append_binary(Rocket *self, PyObject *args) | ||||||
|  | { | ||||||
|  |         int count; | ||||||
|  | 	const uint8_t *data; | ||||||
|  |         int data_len; | ||||||
|  |         int linenum; | ||||||
|  | 	int offset; | ||||||
|  |         long long ll1, ll2, ll3; | ||||||
|  | 	timestamp_t start; | ||||||
|  | 	timestamp_t end; | ||||||
|  | 	timestamp_t last_timestamp; | ||||||
|  |  | ||||||
|  | 	if (!PyArg_ParseTuple(args, "it#iiLLL:append_binary", | ||||||
|  |                               &count, &data, &data_len, &offset, | ||||||
|  |                               &linenum, &ll1, &ll2, &ll3)) | ||||||
|  | 		return NULL; | ||||||
|  |         start = ll1; | ||||||
|  |         end = ll2; | ||||||
|  |         last_timestamp = ll3; | ||||||
|  |  | ||||||
|  |         /* Advance to offset */ | ||||||
|  |         if (offset > data_len) | ||||||
|  |                 return raise_str(0, 0, ERR_OTHER, "bad offset"); | ||||||
|  |         data += offset; | ||||||
|  |         data_len -= offset; | ||||||
|  |  | ||||||
|  |         /* Figure out max number of rows to insert */ | ||||||
|  |         int rows = data_len / self->binary_size; | ||||||
|  |         if (rows > count) | ||||||
|  |                 rows = count; | ||||||
|  |  | ||||||
|  |         /* Check timestamps */ | ||||||
|  |         timestamp_t ts; | ||||||
|  | 	int i; | ||||||
|  |         for (i = 0; i < rows; i++) { | ||||||
|  |                 /* Read raw timestamp, byteswap if needed */ | ||||||
|  |                 memcpy(&ts, &data[i * self->binary_size], 8); | ||||||
|  |                 ts = le64toh(ts); | ||||||
|  |  | ||||||
|  |                 /* Check limits */ | ||||||
|  |                 if (ts <= last_timestamp) | ||||||
|  |                         return raise_int(i, 0, ERR_NON_MONOTONIC, ts); | ||||||
|  |                 last_timestamp = ts; | ||||||
|  |                 if (ts < start || ts >= end) | ||||||
|  |                         return raise_int(i, 0, ERR_OUT_OF_INTERVAL, ts); | ||||||
|  |         } | ||||||
|  |  | ||||||
|  |         /* Write binary data */ | ||||||
|  |         if (fwrite(data, self->binary_size, rows, self->file) != rows) { | ||||||
|  |                 PyErr_SetFromErrno(PyExc_OSError); | ||||||
|  |                 return NULL; | ||||||
|  |         } | ||||||
|  | 	fflush(self->file); | ||||||
|  |  | ||||||
|  | 	/* Build return value and return */ | ||||||
|  | 	PyObject *o; | ||||||
|  | 	o = Py_BuildValue("(iiLi)", rows, offset + rows * self->binary_size, | ||||||
|  |                           (long long)last_timestamp, linenum); | ||||||
|  | 	return o; | ||||||
|  | } | ||||||
|  |  | ||||||
| /**** | /**** | ||||||
|  * Extract to string |  * Extract to string | ||||||
|  */ |  */ | ||||||
| @@ -472,7 +539,7 @@ static PyObject *Rocket_extract_string(Rocket *self, PyObject *args) | |||||||
| 		if (fread(&t64.u, 8, 1, self->file) != 1) | 		if (fread(&t64.u, 8, 1, self->file) != 1) | ||||||
| 			goto err; | 			goto err; | ||||||
| 		t64.u = le64toh(t64.u); | 		t64.u = le64toh(t64.u); | ||||||
| 		ret = sprintf(&str[len], "%ld", t64.i); | 		ret = sprintf(&str[len], "%" PRId64, t64.i); | ||||||
| 		if (ret <= 0) | 		if (ret <= 0) | ||||||
| 			goto err; | 			goto err; | ||||||
| 		len += ret; | 		len += ret; | ||||||
| @@ -484,7 +551,7 @@ static PyObject *Rocket_extract_string(Rocket *self, PyObject *args) | |||||||
| 			/* read and format in a loop */			\ | 			/* read and format in a loop */			\ | ||||||
| 			for (i = 0; i < self->layout_count; i++) {	\ | 			for (i = 0; i < self->layout_count; i++) {	\ | ||||||
| 				if (fread(&disktype, bytes,		\ | 				if (fread(&disktype, bytes,		\ | ||||||
| 					  1, self->file) < 0)		\ | 					  1, self->file) != 1)		\ | ||||||
| 					goto err;			\ | 					goto err;			\ | ||||||
| 				disktype = letoh(disktype);		\ | 				disktype = letoh(disktype);		\ | ||||||
| 				ret = sprintf(&str[len], " " fmt,	\ | 				ret = sprintf(&str[len], " " fmt,	\ | ||||||
| @@ -494,14 +561,14 @@ static PyObject *Rocket_extract_string(Rocket *self, PyObject *args) | |||||||
| 				len += ret;				\ | 				len += ret;				\ | ||||||
| 			}						\ | 			}						\ | ||||||
| 			break | 			break | ||||||
| 			CASE(INT8,   "%hhd",   t8.i,  t8.u,         , 1); | 			CASE(INT8,   "%" PRId8,  t8.i,  t8.u,         , 1); | ||||||
| 			CASE(UINT8,  "%hhu",   t8.u,  t8.u,         , 1); | 			CASE(UINT8,  "%" PRIu8,  t8.u,  t8.u,         , 1); | ||||||
| 			CASE(INT16,  "%hd",    t16.i, t16.u, le16toh, 2); | 			CASE(INT16,  "%" PRId16, t16.i, t16.u, le16toh, 2); | ||||||
| 			CASE(UINT16, "%hu",    t16.u, t16.u, le16toh, 2); | 			CASE(UINT16, "%" PRIu16, t16.u, t16.u, le16toh, 2); | ||||||
| 			CASE(INT32,  "%d",     t32.i, t32.u, le32toh, 4); | 			CASE(INT32,  "%" PRId32, t32.i, t32.u, le32toh, 4); | ||||||
| 			CASE(UINT32, "%u",     t32.u, t32.u, le32toh, 4); | 			CASE(UINT32, "%" PRIu32, t32.u, t32.u, le32toh, 4); | ||||||
| 			CASE(INT64,  "%ld",    t64.i, t64.u, le64toh, 8); | 			CASE(INT64,  "%" PRId64, t64.i, t64.u, le64toh, 8); | ||||||
| 			CASE(UINT64, "%lu",    t64.u, t64.u, le64toh, 8); | 			CASE(UINT64, "%" PRIu64, t64.u, t64.u, le64toh, 8); | ||||||
| 			/* These next two are a bit debatable.  floats | 			/* These next two are a bit debatable.  floats | ||||||
| 			   are 6-9 significant figures, so we print 7. | 			   are 6-9 significant figures, so we print 7. | ||||||
| 			   Doubles are 15-19, so we print 17.  This is | 			   Doubles are 15-19, so we print 17.  This is | ||||||
| @@ -527,6 +594,46 @@ err: | |||||||
| 	return NULL; | 	return NULL; | ||||||
| } | } | ||||||
|  |  | ||||||
|  | /**** | ||||||
|  |  * Extract to binary string containing raw little-endian binary data | ||||||
|  |  */ | ||||||
|  | static PyObject *Rocket_extract_binary(Rocket *self, PyObject *args) | ||||||
|  | { | ||||||
|  | 	long count; | ||||||
|  | 	long offset; | ||||||
|  |  | ||||||
|  | 	if (!PyArg_ParseTuple(args, "ll", &offset, &count)) | ||||||
|  | 		return NULL; | ||||||
|  | 	if (!self->file) { | ||||||
|  | 		PyErr_SetString(PyExc_Exception, "no file"); | ||||||
|  | 		return NULL; | ||||||
|  | 	} | ||||||
|  | 	/* Seek to target location */ | ||||||
|  | 	if (fseek(self->file, offset, SEEK_SET) < 0) { | ||||||
|  | 		PyErr_SetFromErrno(PyExc_OSError); | ||||||
|  | 		return NULL; | ||||||
|  | 	} | ||||||
|  |  | ||||||
|  |         uint8_t *str; | ||||||
|  |         int len = count * self->binary_size; | ||||||
|  |         str = malloc(len); | ||||||
|  |         if (str == NULL) { | ||||||
|  |                 PyErr_SetFromErrno(PyExc_OSError); | ||||||
|  |                 return NULL; | ||||||
|  |         } | ||||||
|  |  | ||||||
|  |         /* Data in the file is already in the desired little-endian | ||||||
|  |            binary format, so just read it directly. */ | ||||||
|  |         if (fread(str, self->binary_size, count, self->file) != count) { | ||||||
|  |                 free(str); | ||||||
|  |                 PyErr_SetFromErrno(PyExc_OSError); | ||||||
|  |                 return NULL; | ||||||
|  |         } | ||||||
|  |  | ||||||
|  | 	PyObject *pystr = PyBytes_FromStringAndSize((char *)str, len); | ||||||
|  | 	free(str); | ||||||
|  | 	return pystr; | ||||||
|  | } | ||||||
|  |  | ||||||
| /**** | /**** | ||||||
|  * Extract timestamp |  * Extract timestamp | ||||||
| @@ -551,7 +658,7 @@ static PyObject *Rocket_extract_timestamp(Rocket *self, PyObject *args) | |||||||
|  |  | ||||||
| 	/* Convert and return */ | 	/* Convert and return */ | ||||||
| 	t64.u = le64toh(t64.u); | 	t64.u = le64toh(t64.u); | ||||||
| 	return Py_BuildValue("l", t64.i); | 	return Py_BuildValue("L", (long long)t64.i); | ||||||
| } | } | ||||||
|  |  | ||||||
| /**** | /**** | ||||||
| @@ -571,11 +678,13 @@ static PyMemberDef Rocket_members[] = { | |||||||
| }; | }; | ||||||
|  |  | ||||||
| static PyMethodDef Rocket_methods[] = { | static PyMethodDef Rocket_methods[] = { | ||||||
| 	{ "close", (PyCFunction)Rocket_close, METH_NOARGS, | 	{ "close", | ||||||
|  |           (PyCFunction)Rocket_close, METH_NOARGS, | ||||||
| 	  "close(self)\n\n" | 	  "close(self)\n\n" | ||||||
| 	  "Close file handle" }, | 	  "Close file handle" }, | ||||||
|  |  | ||||||
| 	{ "append_string", (PyCFunction)Rocket_append_string, METH_VARARGS, | 	{ "append_string", | ||||||
|  |           (PyCFunction)Rocket_append_string, METH_VARARGS, | ||||||
| 	  "append_string(self, count, data, offset, line, start, end, ts)\n\n" | 	  "append_string(self, count, data, offset, line, start, end, ts)\n\n" | ||||||
|           "Parse string and append data.\n" |           "Parse string and append data.\n" | ||||||
| 	  "\n" | 	  "\n" | ||||||
| @@ -590,16 +699,46 @@ static PyMethodDef Rocket_methods[] = { | |||||||
| 	  "Raises ParseError if timestamps are non-monotonic, outside\n" | 	  "Raises ParseError if timestamps are non-monotonic, outside\n" | ||||||
| 	  "the start/end interval etc.\n" | 	  "the start/end interval etc.\n" | ||||||
| 	  "\n" | 	  "\n" | ||||||
|           "On success, return a tuple with three values:\n" |           "On success, return a tuple:\n" | ||||||
|           "  added_rows: how many rows were added from the file\n" |           "  added_rows: how many rows were added from the file\n" | ||||||
|           "  data_offset: current offset into the data string\n" |           "  data_offset: current offset into the data string\n" | ||||||
|           "  last_timestamp: last timestamp we parsed" }, |           "  last_timestamp: last timestamp we parsed\n" | ||||||
|  |           "  linenum: current line number" }, | ||||||
|  |  | ||||||
| 	{ "extract_string", (PyCFunction)Rocket_extract_string, METH_VARARGS, | 	{ "append_binary", | ||||||
|  | 	  (PyCFunction)Rocket_append_binary, METH_VARARGS, | ||||||
|  | 	  "append_binary(self, count, data, offset, line, start, end, ts)\n\n" | ||||||
|  |           "Append binary data, which must match the data layout.\n" | ||||||
|  | 	  "\n" | ||||||
|  | 	  "  count: maximum number of rows to add\n" | ||||||
|  |           "  data: binary data\n" | ||||||
|  |           "  offset: byte offset into data to start adding\n" | ||||||
|  |           "  line: current line number (unused)\n" | ||||||
|  |           "  start: starting timestamp for interval\n" | ||||||
|  |           "  end: end timestamp for interval\n" | ||||||
|  |           "  ts: last timestamp that was previously parsed\n" | ||||||
|  | 	  "\n" | ||||||
|  | 	  "Raises ParseError if timestamps are non-monotonic, outside\n" | ||||||
|  | 	  "the start/end interval etc.\n" | ||||||
|  | 	  "\n" | ||||||
|  |           "On success, return a tuple:\n" | ||||||
|  |           "  added_rows: how many rows were added from the file\n" | ||||||
|  |           "  data_offset: current offset into the data string\n" | ||||||
|  |           "  last_timestamp: last timestamp we parsed\n" | ||||||
|  |           "  linenum: current line number (copied from argument)" }, | ||||||
|  |  | ||||||
|  | 	{ "extract_string", | ||||||
|  |           (PyCFunction)Rocket_extract_string, METH_VARARGS, | ||||||
| 	  "extract_string(self, offset, count)\n\n" | 	  "extract_string(self, offset, count)\n\n" | ||||||
| 	  "Extract count rows of data from the file at offset offset.\n" | 	  "Extract count rows of data from the file at offset offset.\n" | ||||||
| 	  "Return an ascii formatted string according to the layout" }, | 	  "Return an ascii formatted string according to the layout" }, | ||||||
|  |  | ||||||
|  | 	{ "extract_binary", | ||||||
|  | 	  (PyCFunction)Rocket_extract_binary, METH_VARARGS, | ||||||
|  | 	  "extract_binary(self, offset, count)\n\n" | ||||||
|  | 	  "Extract count rows of data from the file at offset offset.\n" | ||||||
|  | 	  "Return a raw binary string of data matching the data layout." }, | ||||||
|  |  | ||||||
| 	{ "extract_timestamp", | 	{ "extract_timestamp", | ||||||
| 	  (PyCFunction)Rocket_extract_timestamp, METH_VARARGS, | 	  (PyCFunction)Rocket_extract_timestamp, METH_VARARGS, | ||||||
| 	  "extract_timestamp(self, offset)\n\n" | 	  "extract_timestamp(self, offset)\n\n" | ||||||
|   | |||||||
| @@ -11,130 +11,32 @@ from nilmdb.utils.time import string_to_timestamp | |||||||
| import cherrypy | import cherrypy | ||||||
| import sys | import sys | ||||||
| import os | import os | ||||||
|  | import socket | ||||||
| import simplejson as json | import simplejson as json | ||||||
| import decorator | import decorator | ||||||
| import psutil | import psutil | ||||||
|  | import traceback | ||||||
|  |  | ||||||
|  | from nilmdb.server.serverutil import ( | ||||||
|  |     chunked_response, | ||||||
|  |     response_type, | ||||||
|  |     workaround_cp_bug_1200, | ||||||
|  |     exception_to_httperror, | ||||||
|  |     CORS_allow, | ||||||
|  |     json_to_request_params, | ||||||
|  |     json_error_page, | ||||||
|  |     cherrypy_start, | ||||||
|  |     cherrypy_stop, | ||||||
|  |     bool_param, | ||||||
|  |     ) | ||||||
|  |  | ||||||
|  | # Add CORS_allow tool | ||||||
|  | cherrypy.tools.CORS_allow = cherrypy.Tool('on_start_resource', CORS_allow) | ||||||
|  |  | ||||||
| class NilmApp(object): | class NilmApp(object): | ||||||
|     def __init__(self, db): |     def __init__(self, db): | ||||||
|         self.db = db |         self.db = db | ||||||
|  |  | ||||||
| # Decorators |  | ||||||
| def chunked_response(func): |  | ||||||
|     """Decorator to enable chunked responses.""" |  | ||||||
|     # Set this to False to get better tracebacks from some requests |  | ||||||
|     # (/stream/extract, /stream/intervals). |  | ||||||
|     func._cp_config = { 'response.stream': True } |  | ||||||
|     return func |  | ||||||
|  |  | ||||||
| def response_type(content_type): |  | ||||||
|     """Return a decorator-generating function that sets the |  | ||||||
|     response type to the specified string.""" |  | ||||||
|     def wrapper(func, *args, **kwargs): |  | ||||||
|         cherrypy.response.headers['Content-Type'] = content_type |  | ||||||
|         return func(*args, **kwargs) |  | ||||||
|     return decorator.decorator(wrapper) |  | ||||||
|  |  | ||||||
| @decorator.decorator |  | ||||||
| def workaround_cp_bug_1200(func, *args, **kwargs): # pragma: no cover |  | ||||||
|     """Decorator to work around CherryPy bug #1200 in a response |  | ||||||
|     generator. |  | ||||||
|  |  | ||||||
|     Even if chunked responses are disabled, LookupError or |  | ||||||
|     UnicodeError exceptions may still be swallowed by CherryPy due to |  | ||||||
|     bug #1200.  This throws them as generic Exceptions instead so that |  | ||||||
|     they make it through. |  | ||||||
|     """ |  | ||||||
|     exc_info = None |  | ||||||
|     try: |  | ||||||
|         for val in func(*args, **kwargs): |  | ||||||
|             yield val |  | ||||||
|     except (LookupError, UnicodeError): |  | ||||||
|         # Re-raise it, but maintain the original traceback |  | ||||||
|         exc_info = sys.exc_info() |  | ||||||
|         new_exc = Exception(exc_info[0].__name__ + ": " + str(exc_info[1])) |  | ||||||
|         raise new_exc, None, exc_info[2] |  | ||||||
|     finally: |  | ||||||
|         del exc_info |  | ||||||
|  |  | ||||||
| def exception_to_httperror(*expected): |  | ||||||
|     """Return a decorator-generating function that catches expected |  | ||||||
|     errors and throws a HTTPError describing it instead. |  | ||||||
|  |  | ||||||
|         @exception_to_httperror(NilmDBError, ValueError) |  | ||||||
|         def foo(): |  | ||||||
|             pass |  | ||||||
|     """ |  | ||||||
|     def wrapper(func, *args, **kwargs): |  | ||||||
|         exc_info = None |  | ||||||
|         try: |  | ||||||
|             return func(*args, **kwargs) |  | ||||||
|         except expected: |  | ||||||
|             # Re-raise it, but maintain the original traceback |  | ||||||
|             exc_info = sys.exc_info() |  | ||||||
|             new_exc = cherrypy.HTTPError("400 Bad Request", str(exc_info[1])) |  | ||||||
|             raise new_exc, None, exc_info[2] |  | ||||||
|         finally: |  | ||||||
|             del exc_info |  | ||||||
|     # We need to preserve the function's argspecs for CherryPy to |  | ||||||
|     # handle argument errors correctly.  Decorator.decorator takes |  | ||||||
|     # care of that. |  | ||||||
|     return decorator.decorator(wrapper) |  | ||||||
|  |  | ||||||
| # Custom CherryPy tools |  | ||||||
|  |  | ||||||
| def CORS_allow(methods): |  | ||||||
|     """This does several things: |  | ||||||
|  |  | ||||||
|     Handles CORS preflight requests. |  | ||||||
|     Adds Allow: header to all requests. |  | ||||||
|     Raise 405 if request.method not in method. |  | ||||||
|  |  | ||||||
|     It is similar to cherrypy.tools.allow, with the CORS stuff added. |  | ||||||
|     """ |  | ||||||
|     request = cherrypy.request.headers |  | ||||||
|     response = cherrypy.response.headers |  | ||||||
|  |  | ||||||
|     if not isinstance(methods, (tuple, list)): # pragma: no cover |  | ||||||
|         methods = [ methods ] |  | ||||||
|     methods = [ m.upper() for m in methods if m ] |  | ||||||
|     if not methods: # pragma: no cover |  | ||||||
|         methods = [ 'GET', 'HEAD' ] |  | ||||||
|     elif 'GET' in methods and 'HEAD' not in methods: # pragma: no cover |  | ||||||
|         methods.append('HEAD') |  | ||||||
|     response['Allow'] = ', '.join(methods) |  | ||||||
|  |  | ||||||
|     # Allow all origins |  | ||||||
|     if 'Origin' in request: |  | ||||||
|         response['Access-Control-Allow-Origin'] = request['Origin'] |  | ||||||
|  |  | ||||||
|     # If it's a CORS request, send response. |  | ||||||
|     request_method = request.get("Access-Control-Request-Method", None) |  | ||||||
|     request_headers = request.get("Access-Control-Request-Headers", None) |  | ||||||
|     if (cherrypy.request.method == "OPTIONS" and |  | ||||||
|         request_method and request_headers): |  | ||||||
|         response['Access-Control-Allow-Headers'] = request_headers |  | ||||||
|         response['Access-Control-Allow-Methods'] = ', '.join(methods) |  | ||||||
|         # Try to stop further processing and return a 200 OK |  | ||||||
|         cherrypy.response.status = "200 OK" |  | ||||||
|         cherrypy.response.body = "" |  | ||||||
|         cherrypy.request.handler = lambda: "" |  | ||||||
|         return |  | ||||||
|  |  | ||||||
|     # Reject methods that were not explicitly allowed |  | ||||||
|     if cherrypy.request.method not in methods: |  | ||||||
|         raise cherrypy.HTTPError(405) |  | ||||||
|  |  | ||||||
| cherrypy.tools.CORS_allow = cherrypy.Tool('on_start_resource', CORS_allow) |  | ||||||
|  |  | ||||||
| # Helper for json_in tool to process JSON data into normal request |  | ||||||
| # parameters. |  | ||||||
| def json_to_request_params(body): |  | ||||||
|     cherrypy.lib.jsontools.json_processor(body) |  | ||||||
|     if not isinstance(cherrypy.request.json, dict): |  | ||||||
|         raise cherrypy.HTTPError(415) |  | ||||||
|     cherrypy.request.params.update(cherrypy.request.json) |  | ||||||
|  |  | ||||||
| # CherryPy apps | # CherryPy apps | ||||||
| class Root(NilmApp): | class Root(NilmApp): | ||||||
|     """Root application for NILM database""" |     """Root application for NILM database""" | ||||||
| @@ -145,7 +47,10 @@ class Root(NilmApp): | |||||||
|     # / |     # / | ||||||
|     @cherrypy.expose |     @cherrypy.expose | ||||||
|     def index(self): |     def index(self): | ||||||
|         raise cherrypy.NotFound() |         cherrypy.response.headers['Content-Type'] = 'text/plain' | ||||||
|  |         msg = sprintf("This is NilmDB version %s, running on host %s.\n", | ||||||
|  |                       nilmdb.__version__, socket.getfqdn()) | ||||||
|  |         return msg | ||||||
|  |  | ||||||
|     # /favicon.ico |     # /favicon.ico | ||||||
|     @cherrypy.expose |     @cherrypy.expose | ||||||
| @@ -165,13 +70,40 @@ class Root(NilmApp): | |||||||
|         """Return a dictionary with the database path, |         """Return a dictionary with the database path, | ||||||
|         size of the database in bytes, and free disk space in bytes""" |         size of the database in bytes, and free disk space in bytes""" | ||||||
|         path = self.db.get_basepath() |         path = self.db.get_basepath() | ||||||
|  |         usage = psutil.disk_usage(path) | ||||||
|  |         dbsize = nilmdb.utils.du(path) | ||||||
|         return { "path": path, |         return { "path": path, | ||||||
|                  "size": nilmdb.utils.du(path), |                  "size": dbsize, | ||||||
|                  "free": psutil.disk_usage(path).free } |                  "other": usage.used - dbsize, | ||||||
|  |                  "reserved": usage.total - usage.used - usage.free, | ||||||
|  |                  "free": usage.free } | ||||||
|  |  | ||||||
| class Stream(NilmApp): | class Stream(NilmApp): | ||||||
|     """Stream-specific operations""" |     """Stream-specific operations""" | ||||||
|  |  | ||||||
|  |     # Helpers | ||||||
|  |     def _get_times(self, start_param, end_param): | ||||||
|  |         (start, end) = (None, None) | ||||||
|  |         try: | ||||||
|  |             if start_param is not None: | ||||||
|  |                 start = string_to_timestamp(start_param) | ||||||
|  |         except Exception: | ||||||
|  |             raise cherrypy.HTTPError("400 Bad Request", sprintf( | ||||||
|  |                 "invalid start (%s): must be a numeric timestamp", start_param)) | ||||||
|  |         try: | ||||||
|  |             if end_param is not None: | ||||||
|  |                 end = string_to_timestamp(end_param) | ||||||
|  |         except Exception: | ||||||
|  |             raise cherrypy.HTTPError("400 Bad Request", sprintf( | ||||||
|  |                 "invalid end (%s): must be a numeric timestamp", end_param)) | ||||||
|  |         if start is not None and end is not None: | ||||||
|  |             if start >= end: | ||||||
|  |                 raise cherrypy.HTTPError( | ||||||
|  |                     "400 Bad Request", | ||||||
|  |                     sprintf("start must precede end (%s >= %s)", | ||||||
|  |                             start_param, end_param)) | ||||||
|  |         return (start, end) | ||||||
|  |  | ||||||
|     # /stream/list |     # /stream/list | ||||||
|     # /stream/list?layout=float32_8 |     # /stream/list?layout=float32_8 | ||||||
|     # /stream/list?path=/newton/prep&extended=1 |     # /stream/list?path=/newton/prep&extended=1 | ||||||
| @@ -182,10 +114,10 @@ class Stream(NilmApp): | |||||||
|         layout parameter, just list streams that match the given path |         layout parameter, just list streams that match the given path | ||||||
|         or layout. |         or layout. | ||||||
|  |  | ||||||
|         If extent is not given, returns a list of lists containing |         If extended is missing or zero, returns a list of lists | ||||||
|         the path and layout: [ path, layout ] |         containing the path and layout: [ path, layout ] | ||||||
|  |  | ||||||
|         If extended is provided, returns a list of lists containing |         If extended is true, returns a list of lists containing | ||||||
|         extended info: [ path, layout, extent_min, extent_max, |         extended info: [ path, layout, extent_min, extent_max, | ||||||
|         total_rows, total_seconds ].  More data may be added. |         total_rows, total_seconds ].  More data may be added. | ||||||
|         """ |         """ | ||||||
| @@ -210,7 +142,7 @@ class Stream(NilmApp): | |||||||
|     @exception_to_httperror(NilmDBError) |     @exception_to_httperror(NilmDBError) | ||||||
|     @cherrypy.tools.CORS_allow(methods = ["POST"]) |     @cherrypy.tools.CORS_allow(methods = ["POST"]) | ||||||
|     def destroy(self, path): |     def destroy(self, path): | ||||||
|         """Delete a stream and its associated data.""" |         """Delete a stream.  Fails if any data is still present.""" | ||||||
|         return self.db.stream_destroy(path) |         return self.db.stream_destroy(path) | ||||||
|  |  | ||||||
|     # /stream/rename?oldpath=/newton/prep&newpath=/newton/prep/1 |     # /stream/rename?oldpath=/newton/prep&newpath=/newton/prep/1 | ||||||
| @@ -288,32 +220,42 @@ class Stream(NilmApp): | |||||||
|     @cherrypy.tools.json_out() |     @cherrypy.tools.json_out() | ||||||
|     @exception_to_httperror(NilmDBError, ValueError) |     @exception_to_httperror(NilmDBError, ValueError) | ||||||
|     @cherrypy.tools.CORS_allow(methods = ["PUT"]) |     @cherrypy.tools.CORS_allow(methods = ["PUT"]) | ||||||
|     def insert(self, path, start, end): |     def insert(self, path, start, end, binary = False): | ||||||
|         """ |         """ | ||||||
|         Insert new data into the database.  Provide textual data |         Insert new data into the database.  Provide textual data | ||||||
|         (matching the path's layout) as a HTTP PUT. |         (matching the path's layout) as a HTTP PUT. | ||||||
|  |  | ||||||
|  |         If 'binary' is True, expect raw binary data, rather than lines | ||||||
|  |         of ASCII-formatted data.  Raw binary data is always | ||||||
|  |         little-endian and matches the database types (including an | ||||||
|  |         int64 timestamp). | ||||||
|         """ |         """ | ||||||
|  |         binary = bool_param(binary) | ||||||
|  |  | ||||||
|         # Important that we always read the input before throwing any |         # Important that we always read the input before throwing any | ||||||
|         # errors, to keep lengths happy for persistent connections. |         # errors, to keep lengths happy for persistent connections. | ||||||
|         # Note that CherryPy 3.2.2 has a bug where this fails for GET |         # Note that CherryPy 3.2.2 has a bug where this fails for GET | ||||||
|         # requests, if we ever want to handle those (issue #1134) |         # requests, if we ever want to handle those (issue #1134) | ||||||
|         body = cherrypy.request.body.read() |         body = cherrypy.request.body.read() | ||||||
|  |  | ||||||
|  |         # Verify content type for binary data | ||||||
|  |         content_type = cherrypy.request.headers.get('content-type') | ||||||
|  |         if binary and content_type: | ||||||
|  |             if content_type != "application/octet-stream": | ||||||
|  |                 raise cherrypy.HTTPError("400", "Content type must be " | ||||||
|  |                                          "application/octet-stream for " | ||||||
|  |                                          "binary data, not " + content_type) | ||||||
|  |  | ||||||
|         # Check path and get layout |         # Check path and get layout | ||||||
|         streams = self.db.stream_list(path = path) |         if len(self.db.stream_list(path = path)) != 1: | ||||||
|         if len(streams) != 1: |             raise cherrypy.HTTPError("404", "No such stream: " + path) | ||||||
|             raise cherrypy.HTTPError("404 Not Found", "No such stream") |  | ||||||
|  |  | ||||||
|         # Check limits |         # Check limits | ||||||
|         start = string_to_timestamp(start) |         (start, end) = self._get_times(start, end) | ||||||
|         end = string_to_timestamp(end) |  | ||||||
|         if start >= end: |  | ||||||
|             raise cherrypy.HTTPError("400 Bad Request", |  | ||||||
|                                      "start must precede end") |  | ||||||
|  |  | ||||||
|         # Pass the data directly to nilmdb, which will parse it and |         # Pass the data directly to nilmdb, which will parse it and | ||||||
|         # raise a ValueError if there are any problems. |         # raise a ValueError if there are any problems. | ||||||
|         self.db.stream_insert(path, start, end, body) |         self.db.stream_insert(path, start, end, body, binary) | ||||||
|  |  | ||||||
|         # Done |         # Done | ||||||
|         return |         return | ||||||
| @@ -322,24 +264,34 @@ class Stream(NilmApp): | |||||||
|     # /stream/remove?path=/newton/prep&start=1234567890.0&end=1234567899.0 |     # /stream/remove?path=/newton/prep&start=1234567890.0&end=1234567899.0 | ||||||
|     @cherrypy.expose |     @cherrypy.expose | ||||||
|     @cherrypy.tools.json_in() |     @cherrypy.tools.json_in() | ||||||
|     @cherrypy.tools.json_out() |  | ||||||
|     @exception_to_httperror(NilmDBError) |  | ||||||
|     @cherrypy.tools.CORS_allow(methods = ["POST"]) |     @cherrypy.tools.CORS_allow(methods = ["POST"]) | ||||||
|  |     @chunked_response | ||||||
|  |     @response_type("application/x-json-stream") | ||||||
|     def remove(self, path, start = None, end = None): |     def remove(self, path, start = None, end = None): | ||||||
|         """ |         """ | ||||||
|         Remove data from the backend database.  Removes all data in |         Remove data from the backend database.  Removes all data in | ||||||
|         the interval [start, end).  Returns the number of data points |         the interval [start, end). | ||||||
|         removed. |  | ||||||
|  |         Returns the number of data points removed.  Since this is a potentially | ||||||
|  |         long-running operation, multiple numbers may be returned as the | ||||||
|  |         data gets removed from the backend database.  The total number of | ||||||
|  |         points removed is the sum of all of these numbers. | ||||||
|         """ |         """ | ||||||
|         if start is not None: |         (start, end) = self._get_times(start, end) | ||||||
|             start = string_to_timestamp(start) |  | ||||||
|         if end is not None: |         if len(self.db.stream_list(path = path)) != 1: | ||||||
|             end = string_to_timestamp(end) |             raise cherrypy.HTTPError("404", "No such stream: " + path) | ||||||
|         if start is not None and end is not None: |  | ||||||
|             if start >= end: |         @workaround_cp_bug_1200 | ||||||
|                 raise cherrypy.HTTPError("400 Bad Request", |         def content(start, end): | ||||||
|                                          "start must precede end") |             # Note: disable chunked responses to see tracebacks from here. | ||||||
|         return self.db.stream_remove(path, start, end) |             while True: | ||||||
|  |                 (removed, restart) = self.db.stream_remove(path, start, end) | ||||||
|  |                 yield json.dumps(removed) + "\r\n" | ||||||
|  |                 if restart is None: | ||||||
|  |                     break | ||||||
|  |                 start = restart | ||||||
|  |         return content(start, end) | ||||||
|  |  | ||||||
|     # /stream/intervals?path=/newton/prep |     # /stream/intervals?path=/newton/prep | ||||||
|     # /stream/intervals?path=/newton/prep&start=1234567890.0&end=1234567899.0 |     # /stream/intervals?path=/newton/prep&start=1234567890.0&end=1234567899.0 | ||||||
| @@ -362,15 +314,7 @@ class Stream(NilmApp): | |||||||
|         Note that the response type is the non-standard |         Note that the response type is the non-standard | ||||||
|         'application/x-json-stream' for lack of a better option. |         'application/x-json-stream' for lack of a better option. | ||||||
|         """ |         """ | ||||||
|         if start is not None: |         (start, end) = self._get_times(start, end) | ||||||
|             start = string_to_timestamp(start) |  | ||||||
|         if end is not None: |  | ||||||
|             end = string_to_timestamp(end) |  | ||||||
|  |  | ||||||
|         if start is not None and end is not None: |  | ||||||
|             if start >= end: |  | ||||||
|                 raise cherrypy.HTTPError("400 Bad Request", |  | ||||||
|                                          "start must precede end") |  | ||||||
|  |  | ||||||
|         if len(self.db.stream_list(path = path)) != 1: |         if len(self.db.stream_list(path = path)) != 1: | ||||||
|             raise cherrypy.HTTPError("404", "No such stream: " + path) |             raise cherrypy.HTTPError("404", "No such stream: " + path) | ||||||
| @@ -386,7 +330,7 @@ class Stream(NilmApp): | |||||||
|                                                            diffpath) |                                                            diffpath) | ||||||
|                 response = ''.join([ json.dumps(i) + "\r\n" for i in ints ]) |                 response = ''.join([ json.dumps(i) + "\r\n" for i in ints ]) | ||||||
|                 yield response |                 yield response | ||||||
|                 if restart == 0: |                 if restart is None: | ||||||
|                     break |                     break | ||||||
|                 start = restart |                 start = restart | ||||||
|         return content(start, end) |         return content(start, end) | ||||||
| @@ -394,48 +338,62 @@ class Stream(NilmApp): | |||||||
|     # /stream/extract?path=/newton/prep&start=1234567890.0&end=1234567899.0 |     # /stream/extract?path=/newton/prep&start=1234567890.0&end=1234567899.0 | ||||||
|     @cherrypy.expose |     @cherrypy.expose | ||||||
|     @chunked_response |     @chunked_response | ||||||
|     @response_type("text/plain") |     def extract(self, path, start = None, end = None, | ||||||
|     def extract(self, path, start = None, end = None, count = False): |                 count = False, markup = False, binary = False): | ||||||
|         """ |         """ | ||||||
|         Extract data from backend database.  Streams the resulting |         Extract data from backend database.  Streams the resulting | ||||||
|         entries as ASCII text lines separated by newlines.  This may |         entries as ASCII text lines separated by newlines.  This may | ||||||
|         make multiple requests to the nilmdb backend to avoid causing |         make multiple requests to the nilmdb backend to avoid causing | ||||||
|         it to block for too long. |         it to block for too long. | ||||||
|  |  | ||||||
|         Add count=True to return a count rather than actual data. |         If 'count' is True, returns a count rather than actual data. | ||||||
|         """ |  | ||||||
|         if start is not None: |  | ||||||
|             start = string_to_timestamp(start) |  | ||||||
|         if end is not None: |  | ||||||
|             end = string_to_timestamp(end) |  | ||||||
|  |  | ||||||
|         # Check parameters |         If 'markup' is True, adds comments to the stream denoting each | ||||||
|         if start is not None and end is not None: |         interval's start and end timestamp. | ||||||
|             if start >= end: |  | ||||||
|                 raise cherrypy.HTTPError("400 Bad Request", |         If 'binary' is True, return raw binary data, rather than lines | ||||||
|                                          "start must precede end") |         of ASCII-formatted data.  Raw binary data is always | ||||||
|  |         little-endian and matches the database types (including an | ||||||
|  |         int64 timestamp). | ||||||
|  |         """ | ||||||
|  |         binary = bool_param(binary) | ||||||
|  |         markup = bool_param(markup) | ||||||
|  |         count = bool_param(count) | ||||||
|  |  | ||||||
|  |         (start, end) = self._get_times(start, end) | ||||||
|  |  | ||||||
|         # Check path and get layout |         # Check path and get layout | ||||||
|         streams = self.db.stream_list(path = path) |         if len(self.db.stream_list(path = path)) != 1: | ||||||
|         if len(streams) != 1: |             raise cherrypy.HTTPError("404", "No such stream: " + path) | ||||||
|             raise cherrypy.HTTPError("404 Not Found", "No such stream") |  | ||||||
|  |         if binary: | ||||||
|  |             content_type = "application/octet-stream" | ||||||
|  |             if markup or count: | ||||||
|  |                 raise cherrypy.HTTPError("400", "can't mix binary and " | ||||||
|  |                                          "markup or count modes") | ||||||
|  |         else: | ||||||
|  |             content_type = "text/plain" | ||||||
|  |         cherrypy.response.headers['Content-Type'] = content_type | ||||||
|  |  | ||||||
|         @workaround_cp_bug_1200 |         @workaround_cp_bug_1200 | ||||||
|         def content(start, end, count): |         def content(start, end): | ||||||
|             # Note: disable chunked responses to see tracebacks from here. |             # Note: disable chunked responses to see tracebacks from here. | ||||||
|             if count: |             if count: | ||||||
|                 matched = self.db.stream_extract(path, start, end, count) |                 matched = self.db.stream_extract(path, start, end, | ||||||
|  |                                                  count = True) | ||||||
|                 yield sprintf("%d\n", matched) |                 yield sprintf("%d\n", matched) | ||||||
|                 return |                 return | ||||||
|  |  | ||||||
|             while True: |             while True: | ||||||
|                 (data, restart) = self.db.stream_extract(path, start, end) |                 (data, restart) = self.db.stream_extract( | ||||||
|  |                     path, start, end, count = False, | ||||||
|  |                     markup = markup, binary = binary) | ||||||
|                 yield data |                 yield data | ||||||
|  |  | ||||||
|                 if restart == 0: |                 if restart is None: | ||||||
|                     return |                     return | ||||||
|                 start = restart |                 start = restart | ||||||
|         return content(start, end, count) |         return content(start, end) | ||||||
|  |  | ||||||
| class Exiter(object): | class Exiter(object): | ||||||
|     """App that exits the server, for testing""" |     """App that exits the server, for testing""" | ||||||
| @@ -453,7 +411,8 @@ class Server(object): | |||||||
|                  stoppable = False,       # whether /exit URL exists |                  stoppable = False,       # whether /exit URL exists | ||||||
|                  embedded = True,         # hide diagnostics and output, etc |                  embedded = True,         # hide diagnostics and output, etc | ||||||
|                  fast_shutdown = False,   # don't wait for clients to disconn. |                  fast_shutdown = False,   # don't wait for clients to disconn. | ||||||
|                  force_traceback = False  # include traceback in all errors |                  force_traceback = False, # include traceback in all errors | ||||||
|  |                  basepath = '',           # base URL path for cherrypy.tree | ||||||
|                  ): |                  ): | ||||||
|         # Save server version, just for verification during tests |         # Save server version, just for verification during tests | ||||||
|         self.version = nilmdb.__version__ |         self.version = nilmdb.__version__ | ||||||
| @@ -513,7 +472,7 @@ class Server(object): | |||||||
|         if stoppable: |         if stoppable: | ||||||
|             root.exit = Exiter() |             root.exit = Exiter() | ||||||
|         cherrypy.tree.apps = {} |         cherrypy.tree.apps = {} | ||||||
|         cherrypy.tree.mount(root, "/", config = { "/" : app_config }) |         cherrypy.tree.mount(root, basepath, config = { "/" : app_config }) | ||||||
|  |  | ||||||
|         # Shutdowns normally wait for clients to disconnect.  To speed |         # Shutdowns normally wait for clients to disconnect.  To speed | ||||||
|         # up tests, set fast_shutdown = True |         # up tests, set fast_shutdown = True | ||||||
| @@ -523,69 +482,68 @@ class Server(object): | |||||||
|         else: |         else: | ||||||
|             cherrypy.server.shutdown_timeout = 5 |             cherrypy.server.shutdown_timeout = 5 | ||||||
|  |  | ||||||
|  |         # Set up the WSGI application pointer for external programs | ||||||
|  |         self.wsgi_application = cherrypy.tree | ||||||
|  |  | ||||||
|     def json_error_page(self, status, message, traceback, version): |     def json_error_page(self, status, message, traceback, version): | ||||||
|         """Return a custom error page in JSON so the client can parse it""" |         """Return a custom error page in JSON so the client can parse it""" | ||||||
|         errordata = { "status" : status, |         return json_error_page(status, message, traceback, version, | ||||||
|                       "message" : message, |                                self.force_traceback) | ||||||
|                       "traceback" : traceback } |  | ||||||
|         # Don't send a traceback if the error was 400-499 (client's fault) |  | ||||||
|         try: |  | ||||||
|             code = int(status.split()[0]) |  | ||||||
|             if not self.force_traceback: |  | ||||||
|                 if code >= 400 and code <= 499: |  | ||||||
|                     errordata["traceback"] = "" |  | ||||||
|         except Exception: # pragma: no cover |  | ||||||
|             pass |  | ||||||
|         # Override the response type, which was previously set to text/html |  | ||||||
|         cherrypy.serving.response.headers['Content-Type'] = ( |  | ||||||
|             "application/json;charset=utf-8" ) |  | ||||||
|         # Undo the HTML escaping that cherrypy's get_error_page function applies |  | ||||||
|         # (cherrypy issue 1135) |  | ||||||
|         for k, v in errordata.iteritems(): |  | ||||||
|             v = v.replace("<","<") |  | ||||||
|             v = v.replace(">",">") |  | ||||||
|             v = v.replace("&","&") |  | ||||||
|             errordata[k] = v |  | ||||||
|         return json.dumps(errordata, separators=(',',':')) |  | ||||||
|  |  | ||||||
|     def start(self, blocking = False, event = None): |     def start(self, blocking = False, event = None): | ||||||
|  |         cherrypy_start(blocking, event, self.embedded) | ||||||
|         if not self.embedded: # pragma: no cover |  | ||||||
|             # Handle signals nicely |  | ||||||
|             if hasattr(cherrypy.engine, "signal_handler"): |  | ||||||
|                 cherrypy.engine.signal_handler.subscribe() |  | ||||||
|             if hasattr(cherrypy.engine, "console_control_handler"): |  | ||||||
|                 cherrypy.engine.console_control_handler.subscribe() |  | ||||||
|  |  | ||||||
|         # Cherrypy stupidly calls os._exit(70) when it can't bind the |  | ||||||
|         # port.  At least try to print a reasonable error and continue |  | ||||||
|         # in this case, rather than just dying silently (as we would |  | ||||||
|         # otherwise do in embedded mode) |  | ||||||
|         real_exit = os._exit |  | ||||||
|         def fake_exit(code): # pragma: no cover |  | ||||||
|             if code == os.EX_SOFTWARE: |  | ||||||
|                 fprintf(sys.stderr, "error: CherryPy called os._exit!\n") |  | ||||||
|             else: |  | ||||||
|                 real_exit(code) |  | ||||||
|         os._exit = fake_exit |  | ||||||
|         cherrypy.engine.start() |  | ||||||
|         os._exit = real_exit |  | ||||||
|  |  | ||||||
|         # Signal that the engine has started successfully |  | ||||||
|         if event is not None: |  | ||||||
|             event.set() |  | ||||||
|  |  | ||||||
|         if blocking: |  | ||||||
|             try: |  | ||||||
|                 cherrypy.engine.wait(cherrypy.engine.states.EXITING, |  | ||||||
|                                      interval = 0.1, channel = 'main') |  | ||||||
|             except (KeyboardInterrupt, IOError): # pragma: no cover |  | ||||||
|                 cherrypy.engine.log('Keyboard Interrupt: shutting down bus') |  | ||||||
|                 cherrypy.engine.exit() |  | ||||||
|             except SystemExit: # pragma: no cover |  | ||||||
|                 cherrypy.engine.log('SystemExit raised: shutting down bus') |  | ||||||
|                 cherrypy.engine.exit() |  | ||||||
|                 raise |  | ||||||
|  |  | ||||||
|     def stop(self): |     def stop(self): | ||||||
|         cherrypy.engine.exit() |         cherrypy_stop() | ||||||
|  |  | ||||||
|  | # Use a single global nilmdb.server.NilmDB and nilmdb.server.Server | ||||||
|  | # instance since the database can only be opened once.  For this to | ||||||
|  | # work, the web server must use only a single process and single | ||||||
|  | # Python interpreter.  Multiple threads are OK. | ||||||
|  | _wsgi_server = None | ||||||
|  | def wsgi_application(dbpath, basepath): # pragma: no cover | ||||||
|  |     """Return a WSGI application object with a database at the | ||||||
|  |     specified path. | ||||||
|  |  | ||||||
|  |     'dbpath' is a filesystem location, e.g. /home/nilm/db | ||||||
|  |  | ||||||
|  |     'basepath' is the URL path of the application base, which | ||||||
|  |     is the same as the first argument to Apache's WSGIScriptAlias | ||||||
|  |     directive. | ||||||
|  |     """ | ||||||
|  |     def application(environ, start_response): | ||||||
|  |         global _wsgi_server | ||||||
|  |         if _wsgi_server is None: | ||||||
|  |             # Try to start the server | ||||||
|  |             try: | ||||||
|  |                 db = nilmdb.utils.serializer_proxy(nilmdb.server.NilmDB)(dbpath) | ||||||
|  |                 _wsgi_server = nilmdb.server.Server( | ||||||
|  |                     db, embedded = True, | ||||||
|  |                     basepath = basepath.rstrip('/')) | ||||||
|  |             except Exception: | ||||||
|  |                 # Build an error message on failure | ||||||
|  |                 import pprint | ||||||
|  |                 err = sprintf("Initializing database at path '%s' failed:\n\n", | ||||||
|  |                               dbpath) | ||||||
|  |                 err += traceback.format_exc() | ||||||
|  |                 try: | ||||||
|  |                     import pwd | ||||||
|  |                     import grp | ||||||
|  |                     err += sprintf("\nRunning as: uid=%d (%s), gid=%d (%s) " | ||||||
|  |                                    "on host %s, pid %d\n", | ||||||
|  |                                    os.getuid(), pwd.getpwuid(os.getuid())[0], | ||||||
|  |                                    os.getgid(), grp.getgrgid(os.getgid())[0], | ||||||
|  |                                    socket.gethostname(), os.getpid()) | ||||||
|  |                 except ImportError: | ||||||
|  |                     pass | ||||||
|  |                 err += sprintf("\nEnvironment:\n%s\n", pprint.pformat(environ)) | ||||||
|  |         if _wsgi_server is None: | ||||||
|  |             # Serve up the error with our own mini WSGI app. | ||||||
|  |             headers = [ ('Content-type', 'text/plain'), | ||||||
|  |                         ('Content-length', str(len(err))) ] | ||||||
|  |             start_response("500 Internal Server Error", headers) | ||||||
|  |             return [err] | ||||||
|  |  | ||||||
|  |         # Call the normal application | ||||||
|  |         return _wsgi_server.wsgi_application(environ, start_response) | ||||||
|  |     return application | ||||||
|   | |||||||
							
								
								
									
										214
									
								
								nilmdb/server/serverutil.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										214
									
								
								nilmdb/server/serverutil.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,214 @@ | |||||||
|  | """Miscellaneous decorators and other helpers for running a CherryPy | ||||||
|  | server""" | ||||||
|  |  | ||||||
|  | import cherrypy | ||||||
|  | import sys | ||||||
|  | import os | ||||||
|  | import decorator | ||||||
|  | import simplejson as json | ||||||
|  |  | ||||||
|  | # Helper to parse parameters into booleans | ||||||
|  | def bool_param(s): | ||||||
|  |     """Return a bool indicating whether parameter 's' was True or False, | ||||||
|  |     supporting a few different types for 's'.""" | ||||||
|  |     try: | ||||||
|  |         ss = s.lower() | ||||||
|  |         if ss in [ "0", "false", "f", "no", "n" ]: | ||||||
|  |             return False | ||||||
|  |         if ss in [ "1", "true", "t", "yes", "y" ]: | ||||||
|  |             return True | ||||||
|  |     except Exception: | ||||||
|  |         return bool(s) | ||||||
|  |     raise cherrypy.HTTPError("400 Bad Request", | ||||||
|  |                              "can't parse parameter: " + ss) | ||||||
|  |  | ||||||
|  | # Decorators | ||||||
|  | def chunked_response(func): | ||||||
|  |     """Decorator to enable chunked responses.""" | ||||||
|  |     # Set this to False to get better tracebacks from some requests | ||||||
|  |     # (/stream/extract, /stream/intervals). | ||||||
|  |     func._cp_config = { 'response.stream': True } | ||||||
|  |     return func | ||||||
|  |  | ||||||
|  | def response_type(content_type): | ||||||
|  |     """Return a decorator-generating function that sets the | ||||||
|  |     response type to the specified string.""" | ||||||
|  |     def wrapper(func, *args, **kwargs): | ||||||
|  |         cherrypy.response.headers['Content-Type'] = content_type | ||||||
|  |         return func(*args, **kwargs) | ||||||
|  |     return decorator.decorator(wrapper) | ||||||
|  |  | ||||||
|  | @decorator.decorator | ||||||
|  | def workaround_cp_bug_1200(func, *args, **kwargs): # pragma: no cover | ||||||
|  |     """Decorator to work around CherryPy bug #1200 in a response | ||||||
|  |     generator. | ||||||
|  |  | ||||||
|  |     Even if chunked responses are disabled, LookupError or | ||||||
|  |     UnicodeError exceptions may still be swallowed by CherryPy due to | ||||||
|  |     bug #1200.  This throws them as generic Exceptions instead so that | ||||||
|  |     they make it through. | ||||||
|  |     """ | ||||||
|  |     exc_info = None | ||||||
|  |     try: | ||||||
|  |         for val in func(*args, **kwargs): | ||||||
|  |             yield val | ||||||
|  |     except (LookupError, UnicodeError): | ||||||
|  |         # Re-raise it, but maintain the original traceback | ||||||
|  |         exc_info = sys.exc_info() | ||||||
|  |         new_exc = Exception(exc_info[0].__name__ + ": " + str(exc_info[1])) | ||||||
|  |         raise new_exc, None, exc_info[2] | ||||||
|  |     finally: | ||||||
|  |         del exc_info | ||||||
|  |  | ||||||
|  | def exception_to_httperror(*expected): | ||||||
|  |     """Return a decorator-generating function that catches expected | ||||||
|  |     errors and throws a HTTPError describing it instead. | ||||||
|  |  | ||||||
|  |         @exception_to_httperror(NilmDBError, ValueError) | ||||||
|  |         def foo(): | ||||||
|  |             pass | ||||||
|  |     """ | ||||||
|  |     def wrapper(func, *args, **kwargs): | ||||||
|  |         exc_info = None | ||||||
|  |         try: | ||||||
|  |             return func(*args, **kwargs) | ||||||
|  |         except expected: | ||||||
|  |             # Re-raise it, but maintain the original traceback | ||||||
|  |             exc_info = sys.exc_info() | ||||||
|  |             new_exc = cherrypy.HTTPError("400 Bad Request", str(exc_info[1])) | ||||||
|  |             raise new_exc, None, exc_info[2] | ||||||
|  |         finally: | ||||||
|  |             del exc_info | ||||||
|  |     # We need to preserve the function's argspecs for CherryPy to | ||||||
|  |     # handle argument errors correctly.  Decorator.decorator takes | ||||||
|  |     # care of that. | ||||||
|  |     return decorator.decorator(wrapper) | ||||||
|  |  | ||||||
|  | # Custom CherryPy tools | ||||||
|  |  | ||||||
|  | def CORS_allow(methods): | ||||||
|  |     """This does several things: | ||||||
|  |  | ||||||
|  |     Handles CORS preflight requests. | ||||||
|  |     Adds Allow: header to all requests. | ||||||
|  |     Raise 405 if request.method not in method. | ||||||
|  |  | ||||||
|  |     It is similar to cherrypy.tools.allow, with the CORS stuff added. | ||||||
|  |  | ||||||
|  |     Add this to CherryPy with: | ||||||
|  |     cherrypy.tools.CORS_allow = cherrypy.Tool('on_start_resource', CORS_allow) | ||||||
|  |     """ | ||||||
|  |     request = cherrypy.request.headers | ||||||
|  |     response = cherrypy.response.headers | ||||||
|  |  | ||||||
|  |     if not isinstance(methods, (tuple, list)): # pragma: no cover | ||||||
|  |         methods = [ methods ] | ||||||
|  |     methods = [ m.upper() for m in methods if m ] | ||||||
|  |     if not methods: # pragma: no cover | ||||||
|  |         methods = [ 'GET', 'HEAD' ] | ||||||
|  |     elif 'GET' in methods and 'HEAD' not in methods: # pragma: no cover | ||||||
|  |         methods.append('HEAD') | ||||||
|  |     response['Allow'] = ', '.join(methods) | ||||||
|  |  | ||||||
|  |     # Allow all origins | ||||||
|  |     if 'Origin' in request: | ||||||
|  |         response['Access-Control-Allow-Origin'] = request['Origin'] | ||||||
|  |  | ||||||
|  |     # If it's a CORS request, send response. | ||||||
|  |     request_method = request.get("Access-Control-Request-Method", None) | ||||||
|  |     request_headers = request.get("Access-Control-Request-Headers", None) | ||||||
|  |     if (cherrypy.request.method == "OPTIONS" and | ||||||
|  |         request_method and request_headers): | ||||||
|  |         response['Access-Control-Allow-Headers'] = request_headers | ||||||
|  |         response['Access-Control-Allow-Methods'] = ', '.join(methods) | ||||||
|  |         # Try to stop further processing and return a 200 OK | ||||||
|  |         cherrypy.response.status = "200 OK" | ||||||
|  |         cherrypy.response.body = "" | ||||||
|  |         cherrypy.request.handler = lambda: "" | ||||||
|  |         return | ||||||
|  |  | ||||||
|  |     # Reject methods that were not explicitly allowed | ||||||
|  |     if cherrypy.request.method not in methods: | ||||||
|  |         raise cherrypy.HTTPError(405) | ||||||
|  |  | ||||||
|  |  | ||||||
|  | # Helper for json_in tool to process JSON data into normal request | ||||||
|  | # parameters. | ||||||
|  | def json_to_request_params(body): | ||||||
|  |     cherrypy.lib.jsontools.json_processor(body) | ||||||
|  |     if not isinstance(cherrypy.request.json, dict): | ||||||
|  |         raise cherrypy.HTTPError(415) | ||||||
|  |     cherrypy.request.params.update(cherrypy.request.json) | ||||||
|  |  | ||||||
|  | # Used as an "error_page.default" handler | ||||||
|  | def json_error_page(status, message, traceback, version, | ||||||
|  |                     force_traceback = False): | ||||||
|  |     """Return a custom error page in JSON so the client can parse it""" | ||||||
|  |     errordata = { "status" : status, | ||||||
|  |                   "message" : message, | ||||||
|  |                   "traceback" : traceback } | ||||||
|  |     # Don't send a traceback if the error was 400-499 (client's fault) | ||||||
|  |     try: | ||||||
|  |         code = int(status.split()[0]) | ||||||
|  |         if not force_traceback: | ||||||
|  |             if code >= 400 and code <= 499: | ||||||
|  |                 errordata["traceback"] = "" | ||||||
|  |     except Exception: # pragma: no cover | ||||||
|  |         pass | ||||||
|  |     # Override the response type, which was previously set to text/html | ||||||
|  |     cherrypy.serving.response.headers['Content-Type'] = ( | ||||||
|  |         "application/json;charset=utf-8" ) | ||||||
|  |     # Undo the HTML escaping that cherrypy's get_error_page function applies | ||||||
|  |     # (cherrypy issue 1135) | ||||||
|  |     for k, v in errordata.iteritems(): | ||||||
|  |         v = v.replace("<","<") | ||||||
|  |         v = v.replace(">",">") | ||||||
|  |         v = v.replace("&","&") | ||||||
|  |         errordata[k] = v | ||||||
|  |     return json.dumps(errordata, separators=(',',':')) | ||||||
|  |  | ||||||
|  | # Start/stop CherryPy standalone server | ||||||
|  | def cherrypy_start(blocking = False, event = False, embedded = False): | ||||||
|  |     """Start the CherryPy server, handling errors and signals | ||||||
|  |     somewhat gracefully.""" | ||||||
|  |  | ||||||
|  |     if not embedded: # pragma: no cover | ||||||
|  |         # Handle signals nicely | ||||||
|  |         if hasattr(cherrypy.engine, "signal_handler"): | ||||||
|  |             cherrypy.engine.signal_handler.subscribe() | ||||||
|  |         if hasattr(cherrypy.engine, "console_control_handler"): | ||||||
|  |             cherrypy.engine.console_control_handler.subscribe() | ||||||
|  |  | ||||||
|  |     # Cherrypy stupidly calls os._exit(70) when it can't bind the | ||||||
|  |     # port.  At least try to print a reasonable error and continue | ||||||
|  |     # in this case, rather than just dying silently (as we would | ||||||
|  |     # otherwise do in embedded mode) | ||||||
|  |     real_exit = os._exit | ||||||
|  |     def fake_exit(code): # pragma: no cover | ||||||
|  |         if code == os.EX_SOFTWARE: | ||||||
|  |             fprintf(sys.stderr, "error: CherryPy called os._exit!\n") | ||||||
|  |         else: | ||||||
|  |             real_exit(code) | ||||||
|  |     os._exit = fake_exit | ||||||
|  |     cherrypy.engine.start() | ||||||
|  |     os._exit = real_exit | ||||||
|  |  | ||||||
|  |     # Signal that the engine has started successfully | ||||||
|  |     if event is not None: | ||||||
|  |         event.set() | ||||||
|  |  | ||||||
|  |     if blocking: | ||||||
|  |         try: | ||||||
|  |             cherrypy.engine.wait(cherrypy.engine.states.EXITING, | ||||||
|  |                                  interval = 0.1, channel = 'main') | ||||||
|  |         except (KeyboardInterrupt, IOError): # pragma: no cover | ||||||
|  |             cherrypy.engine.log('Keyboard Interrupt: shutting down bus') | ||||||
|  |             cherrypy.engine.exit() | ||||||
|  |         except SystemExit: # pragma: no cover | ||||||
|  |             cherrypy.engine.log('SystemExit raised: shutting down bus') | ||||||
|  |             cherrypy.engine.exit() | ||||||
|  |             raise | ||||||
|  |  | ||||||
|  | # Stop CherryPy server | ||||||
|  | def cherrypy_stop(): | ||||||
|  |     cherrypy.engine.exit() | ||||||
| @@ -1,7 +1,7 @@ | |||||||
| """NilmDB utilities""" | """NilmDB utilities""" | ||||||
|  |  | ||||||
|  | from __future__ import absolute_import | ||||||
| from nilmdb.utils.timer import Timer | from nilmdb.utils.timer import Timer | ||||||
| from nilmdb.utils.iteratorizer import Iteratorizer |  | ||||||
| from nilmdb.utils.serializer import serializer_proxy | from nilmdb.utils.serializer import serializer_proxy | ||||||
| from nilmdb.utils.lrucache import lru_cache | from nilmdb.utils.lrucache import lru_cache | ||||||
| from nilmdb.utils.diskusage import du, human_size | from nilmdb.utils.diskusage import du, human_size | ||||||
| @@ -11,3 +11,7 @@ import nilmdb.utils.threadsafety | |||||||
| import nilmdb.utils.fallocate | import nilmdb.utils.fallocate | ||||||
| import nilmdb.utils.time | import nilmdb.utils.time | ||||||
| import nilmdb.utils.iterator | import nilmdb.utils.iterator | ||||||
|  | import nilmdb.utils.interval | ||||||
|  | import nilmdb.utils.lock | ||||||
|  | import nilmdb.utils.sort | ||||||
|  | import nilmdb.utils.unicode | ||||||
|   | |||||||
| @@ -1,4 +1,5 @@ | |||||||
| import os | import os | ||||||
|  | import errno | ||||||
| from math import log | from math import log | ||||||
|  |  | ||||||
| def human_size(num): | def human_size(num): | ||||||
| @@ -16,10 +17,17 @@ def human_size(num): | |||||||
|         return '1 byte' |         return '1 byte' | ||||||
|  |  | ||||||
| def du(path): | def du(path): | ||||||
|     """Like du -sb, returns total size of path in bytes.""" |     """Like du -sb, returns total size of path in bytes.  Ignore | ||||||
|  |     errors that might occur if we encounter broken symlinks or | ||||||
|  |     files in the process of being removed.""" | ||||||
|  |     try: | ||||||
|         size = os.path.getsize(path) |         size = os.path.getsize(path) | ||||||
|         if os.path.isdir(path): |         if os.path.isdir(path): | ||||||
|             for thisfile in os.listdir(path): |             for thisfile in os.listdir(path): | ||||||
|                 filepath = os.path.join(path, thisfile) |                 filepath = os.path.join(path, thisfile) | ||||||
|                 size += du(filepath) |                 size += du(filepath) | ||||||
|         return size |         return size | ||||||
|  |     except OSError as e: # pragma: no cover | ||||||
|  |         if e.errno != errno.ENOENT: | ||||||
|  |             raise | ||||||
|  |         return 0 | ||||||
|   | |||||||
							
								
								
									
										147
									
								
								nilmdb/utils/interval.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										147
									
								
								nilmdb/utils/interval.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,147 @@ | |||||||
|  | """Interval.  Like nilmdb.server.interval, but re-implemented here | ||||||
|  | in plain Python so clients have easier access to it, and with a few | ||||||
|  | helper functions. | ||||||
|  |  | ||||||
|  | Intervals are half-open, ie. they include data points with timestamps | ||||||
|  | [start, end) | ||||||
|  | """ | ||||||
|  |  | ||||||
|  | import nilmdb.utils.time | ||||||
|  | import nilmdb.utils.iterator | ||||||
|  |  | ||||||
|  | class IntervalError(Exception): | ||||||
|  |     """Error due to interval overlap, etc""" | ||||||
|  |     pass | ||||||
|  |  | ||||||
|  | # Interval | ||||||
|  | class Interval: | ||||||
|  |     """Represents an interval of time.""" | ||||||
|  |  | ||||||
|  |     def __init__(self, start, end): | ||||||
|  |         """ | ||||||
|  |         'start' and 'end' are arbitrary numbers that represent time | ||||||
|  |         """ | ||||||
|  |         if start >= end: | ||||||
|  |             # Explicitly disallow zero-width intervals (since they're half-open) | ||||||
|  |             raise IntervalError("start %s must precede end %s" % (start, end)) | ||||||
|  |         self.start = start | ||||||
|  |         self.end = end | ||||||
|  |  | ||||||
|  |     def __repr__(self): | ||||||
|  |         s = repr(self.start) + ", " + repr(self.end) | ||||||
|  |         return self.__class__.__name__ + "(" + s + ")" | ||||||
|  |  | ||||||
|  |     def __str__(self): | ||||||
|  |         return ("[" + nilmdb.utils.time.timestamp_to_string(self.start) + | ||||||
|  |                 " -> " + nilmdb.utils.time.timestamp_to_string(self.end) + ")") | ||||||
|  |  | ||||||
|  |     def human_string(self): | ||||||
|  |         return ("[ " + nilmdb.utils.time.timestamp_to_human(self.start) + | ||||||
|  |                 " -> " + nilmdb.utils.time.timestamp_to_human(self.end) + " ]") | ||||||
|  |  | ||||||
|  |     def __cmp__(self, other): | ||||||
|  |         """Compare two intervals.  If non-equal, order by start then end""" | ||||||
|  |         return cmp(self.start, other.start) or cmp(self.end, other.end) | ||||||
|  |  | ||||||
|  |     def intersects(self, other): | ||||||
|  |         """Return True if two Interval objects intersect""" | ||||||
|  |         if not isinstance(other, Interval): | ||||||
|  |             raise TypeError("need an Interval") | ||||||
|  |         if self.end <= other.start or self.start >= other.end: | ||||||
|  |             return False | ||||||
|  |         return True | ||||||
|  |  | ||||||
|  |     def subset(self, start, end): | ||||||
|  |         """Return a new Interval that is a subset of this one""" | ||||||
|  |         # A subclass that tracks additional data might override this. | ||||||
|  |         if start < self.start or end > self.end: | ||||||
|  |             raise IntervalError("not a subset") | ||||||
|  |         return Interval(start, end) | ||||||
|  |  | ||||||
|  | def _interval_math_helper(a, b, op, subset = True): | ||||||
|  |     """Helper for set_difference, intersection functions, | ||||||
|  |     to compute interval subsets based on a math operator on ranges | ||||||
|  |     present in A and B.  Subsets are computed from A, or new intervals | ||||||
|  |     are generated if subset = False.""" | ||||||
|  |     # Iterate through all starts and ends in sorted order.  Add a | ||||||
|  |     # tag to the iterator so that we can figure out which one they | ||||||
|  |     # were, after sorting. | ||||||
|  |     def decorate(it, key_start, key_end): | ||||||
|  |         for i in it: | ||||||
|  |             yield i.start, key_start, i | ||||||
|  |             yield i.end, key_end, i | ||||||
|  |     a_iter = decorate(iter(a), 0, 2) | ||||||
|  |     b_iter = decorate(iter(b), 1, 3) | ||||||
|  |  | ||||||
|  |     # Now iterate over the timestamps of each start and end. | ||||||
|  |     # At each point, evaluate which type of end it is, to determine | ||||||
|  |     # how to build up the output intervals. | ||||||
|  |     a_interval = None | ||||||
|  |     in_a = False | ||||||
|  |     in_b = False | ||||||
|  |     out_start = None | ||||||
|  |     for (ts, k, i) in nilmdb.utils.iterator.imerge(a_iter, b_iter): | ||||||
|  |         if k == 0: | ||||||
|  |             a_interval = i | ||||||
|  |             in_a = True | ||||||
|  |         elif k == 1: | ||||||
|  |             in_b = True | ||||||
|  |         elif k == 2: | ||||||
|  |             in_a = False | ||||||
|  |         elif k == 3: | ||||||
|  |             in_b = False | ||||||
|  |         include = op(in_a, in_b) | ||||||
|  |         if include and out_start is None: | ||||||
|  |             out_start = ts | ||||||
|  |         elif not include: | ||||||
|  |             if out_start is not None and out_start != ts: | ||||||
|  |                 if subset: | ||||||
|  |                     yield a_interval.subset(out_start, ts) | ||||||
|  |                 else: | ||||||
|  |                     yield Interval(out_start, ts) | ||||||
|  |             out_start = None | ||||||
|  |  | ||||||
|  | def set_difference(a, b): | ||||||
|  |     """ | ||||||
|  |     Compute the difference (a \\ b) between the intervals in 'a' and | ||||||
|  |     the intervals in 'b'; i.e., the ranges that are present in 'self' | ||||||
|  |     but not 'other'. | ||||||
|  |  | ||||||
|  |     'a' and 'b' must both be iterables. | ||||||
|  |  | ||||||
|  |     Returns a generator that yields each interval in turn. | ||||||
|  |     Output intervals are built as subsets of the intervals in the | ||||||
|  |     first argument (a). | ||||||
|  |     """ | ||||||
|  |     return _interval_math_helper(a, b, (lambda a, b: a and not b)) | ||||||
|  |  | ||||||
|  | def intersection(a, b): | ||||||
|  |     """ | ||||||
|  |     Compute the intersection between the intervals in 'a' and the | ||||||
|  |     intervals in 'b'; i.e., the ranges that are present in both 'a' | ||||||
|  |     and 'b'. | ||||||
|  |  | ||||||
|  |     'a' and 'b' must both be iterables. | ||||||
|  |  | ||||||
|  |     Returns a generator that yields each interval in turn. | ||||||
|  |     Output intervals are built as subsets of the intervals in the | ||||||
|  |     first argument (a). | ||||||
|  |     """ | ||||||
|  |     return _interval_math_helper(a, b, (lambda a, b: a and b)) | ||||||
|  |  | ||||||
|  | def optimize(it): | ||||||
|  |     """ | ||||||
|  |     Given an iterable 'it' with intervals, optimize them by joining | ||||||
|  |     together intervals that are adjacent in time, and return a generator | ||||||
|  |     that yields the new intervals. | ||||||
|  |     """ | ||||||
|  |     saved_int = None | ||||||
|  |     for interval in it: | ||||||
|  |         if saved_int is not None: | ||||||
|  |             if saved_int.end == interval.start: | ||||||
|  |                 interval.start = saved_int.start | ||||||
|  |             else: | ||||||
|  |                 yield saved_int | ||||||
|  |         saved_int = interval | ||||||
|  |     if saved_int is not None: | ||||||
|  |         yield saved_int | ||||||
| @@ -1,100 +0,0 @@ | |||||||
| import Queue |  | ||||||
| import threading |  | ||||||
| import sys |  | ||||||
| import contextlib |  | ||||||
|  |  | ||||||
| # This file provides a context manager that converts a function |  | ||||||
| # that takes a callback into a generator that returns an iterable. |  | ||||||
| # This is done by running the function in a new thread. |  | ||||||
|  |  | ||||||
| # Based partially on http://stackoverflow.com/questions/9968592/ |  | ||||||
|  |  | ||||||
| class IteratorizerThread(threading.Thread): |  | ||||||
|     def __init__(self, queue, function, curl_hack): |  | ||||||
|         """ |  | ||||||
|         function: function to execute, which takes the |  | ||||||
|         callback (provided by this class) as an argument |  | ||||||
|         """ |  | ||||||
|         threading.Thread.__init__(self) |  | ||||||
|         self.name = "Iteratorizer-" + function.__name__ + "-" + self.name |  | ||||||
|         self.function = function |  | ||||||
|         self.queue = queue |  | ||||||
|         self.die = False |  | ||||||
|         self.curl_hack = curl_hack |  | ||||||
|  |  | ||||||
|     def callback(self, data): |  | ||||||
|         try: |  | ||||||
|             if self.die: |  | ||||||
|                 raise Exception() # trigger termination |  | ||||||
|             self.queue.put((1, data)) |  | ||||||
|         except: |  | ||||||
|             if self.curl_hack: |  | ||||||
|                 # We can't raise exceptions, because the pycurl |  | ||||||
|                 # extension module will unconditionally print the |  | ||||||
|                 # exception itself, and not pass it up to the caller. |  | ||||||
|                 # Instead, just return a value that tells curl to |  | ||||||
|                 # abort.  (-1 would be best, in case we were given 0 |  | ||||||
|                 # bytes, but the extension doesn't support that). |  | ||||||
|                 self.queue.put((2, sys.exc_info())) |  | ||||||
|                 return 0 |  | ||||||
|             raise |  | ||||||
|  |  | ||||||
|     def run(self): |  | ||||||
|         try: |  | ||||||
|             result = self.function(self.callback) |  | ||||||
|         except: |  | ||||||
|             self.queue.put((2, sys.exc_info())) |  | ||||||
|         else: |  | ||||||
|             self.queue.put((0, result)) |  | ||||||
|  |  | ||||||
| @contextlib.contextmanager |  | ||||||
| def Iteratorizer(function, curl_hack = False): |  | ||||||
|     """ |  | ||||||
|     Context manager that takes a function expecting a callback, |  | ||||||
|     and provides an iterable that yields the values passed to that |  | ||||||
|     callback instead. |  | ||||||
|  |  | ||||||
|     function: function to execute, which takes a callback |  | ||||||
|     (provided by this context manager) as an argument |  | ||||||
|  |  | ||||||
|         with iteratorizer(func) as it: |  | ||||||
|             for i in it: |  | ||||||
|                 print 'callback was passed:', i |  | ||||||
|         print 'function returned:', it.retval |  | ||||||
|     """ |  | ||||||
|     queue = Queue.Queue(maxsize = 1) |  | ||||||
|     thread = IteratorizerThread(queue, function, curl_hack) |  | ||||||
|     thread.daemon = True |  | ||||||
|     thread.start() |  | ||||||
|  |  | ||||||
|     class iteratorizer_gen(object): |  | ||||||
|         def __init__(self, queue): |  | ||||||
|             self.queue = queue |  | ||||||
|             self.retval = None |  | ||||||
|  |  | ||||||
|         def __iter__(self): |  | ||||||
|             return self |  | ||||||
|  |  | ||||||
|         def next(self): |  | ||||||
|             (typ, data) = self.queue.get() |  | ||||||
|             if typ == 0: |  | ||||||
|                 # function has returned |  | ||||||
|                 self.retval = data |  | ||||||
|                 raise StopIteration |  | ||||||
|             elif typ == 1: |  | ||||||
|                 # data is available |  | ||||||
|                 return data |  | ||||||
|             else: |  | ||||||
|                 # callback raised an exception |  | ||||||
|                 raise data[0], data[1], data[2] |  | ||||||
|  |  | ||||||
|     try: |  | ||||||
|         yield iteratorizer_gen(queue) |  | ||||||
|     finally: |  | ||||||
|         # Ask the thread to die, if it's still running. |  | ||||||
|         thread.die = True |  | ||||||
|         while thread.isAlive(): |  | ||||||
|             try: |  | ||||||
|                 queue.get(True, 0.01) |  | ||||||
|             except: # pragma: no cover |  | ||||||
|                 pass |  | ||||||
							
								
								
									
										33
									
								
								nilmdb/utils/lock.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										33
									
								
								nilmdb/utils/lock.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,33 @@ | |||||||
|  | # File locking | ||||||
|  |  | ||||||
|  | import warnings | ||||||
|  |  | ||||||
|  | try: | ||||||
|  |     import fcntl | ||||||
|  |     import errno | ||||||
|  |  | ||||||
|  |     def exclusive_lock(f): | ||||||
|  |         """Acquire an exclusive lock.  Returns True on successful | ||||||
|  |         lock, or False on error.""" | ||||||
|  |         try: | ||||||
|  |             fcntl.flock(f.fileno(), fcntl.LOCK_EX | fcntl.LOCK_NB) | ||||||
|  |         except IOError as e: | ||||||
|  |             if e.errno in (errno.EACCES, errno.EAGAIN): | ||||||
|  |                 return False | ||||||
|  |             else: # pragma: no cover | ||||||
|  |                 raise | ||||||
|  |         return True | ||||||
|  |  | ||||||
|  |     def exclusive_unlock(f): | ||||||
|  |         """Release an exclusive lock.""" | ||||||
|  |         fcntl.flock(f.fileno(), fcntl.LOCK_UN) | ||||||
|  |  | ||||||
|  | except ImportError: # pragma: no cover | ||||||
|  |     def exclusive_lock(f): | ||||||
|  |         """Dummy lock function -- does not lock!""" | ||||||
|  |         warnings.warn("Pretending to lock " + str(f)) | ||||||
|  |         return True | ||||||
|  |  | ||||||
|  |     def exclusive_unlock(f): | ||||||
|  |         """Release an exclusive lock.""" | ||||||
|  |         return | ||||||
| @@ -15,7 +15,7 @@ def must_close(errorfile = sys.stderr, wrap_verify = False): | |||||||
|         def wrap_class_method(wrapper): |         def wrap_class_method(wrapper): | ||||||
|             try: |             try: | ||||||
|                 orig = getattr(cls, wrapper.__name__).im_func |                 orig = getattr(cls, wrapper.__name__).im_func | ||||||
|             except: |             except Exception: | ||||||
|                 orig = lambda x: None |                 orig = lambda x: None | ||||||
|             setattr(cls, wrapper.__name__, decorator.decorator(wrapper, orig)) |             setattr(cls, wrapper.__name__, decorator.decorator(wrapper, orig)) | ||||||
|  |  | ||||||
|   | |||||||
| @@ -91,6 +91,20 @@ def serializer_proxy(obj_or_type): | |||||||
|             r = SerializerCallProxy(self.__call_queue, attr, self) |             r = SerializerCallProxy(self.__call_queue, attr, self) | ||||||
|             return r |             return r | ||||||
|  |  | ||||||
|  |         # For an interable object, on __iter__(), save the object's | ||||||
|  |         # iterator and return this proxy.  On next(), call the object's | ||||||
|  |         # iterator through this proxy. | ||||||
|  |         def __iter__(self): | ||||||
|  |             attr = getattr(self.__object, "__iter__") | ||||||
|  |             self.__iter = SerializerCallProxy(self.__call_queue, attr, self)() | ||||||
|  |             return self | ||||||
|  |         def next(self): | ||||||
|  |             return SerializerCallProxy(self.__call_queue, | ||||||
|  |                                        self.__iter.next, self)() | ||||||
|  |  | ||||||
|  |         def __getitem__(self, key): | ||||||
|  |             return self.__getattr__("__getitem__")(key) | ||||||
|  |  | ||||||
|         def __call__(self, *args, **kwargs): |         def __call__(self, *args, **kwargs): | ||||||
|             """Call this to instantiate the type, if a type was passed |             """Call this to instantiate the type, if a type was passed | ||||||
|             to serializer_proxy.  Otherwise, pass the call through.""" |             to serializer_proxy.  Otherwise, pass the call through.""" | ||||||
|   | |||||||
							
								
								
									
										18
									
								
								nilmdb/utils/sort.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										18
									
								
								nilmdb/utils/sort.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,18 @@ | |||||||
|  | import re | ||||||
|  |  | ||||||
|  | def sort_human(items, key = None): | ||||||
|  |     """Human-friendly sort (/stream/2 before /stream/10)""" | ||||||
|  |     def to_num(val): | ||||||
|  |         try: | ||||||
|  |             return int(val) | ||||||
|  |         except Exception: | ||||||
|  |             return val | ||||||
|  |  | ||||||
|  |     def human_key(text): | ||||||
|  |         if key: | ||||||
|  |             text = key(text) | ||||||
|  |         # Break into character and numeric chunks. | ||||||
|  |         chunks = re.split(r'([0-9]+)', text) | ||||||
|  |         return [ to_num(c) for c in chunks ] | ||||||
|  |  | ||||||
|  |     return sorted(items, key = human_key) | ||||||
| @@ -1,9 +1,12 @@ | |||||||
|  | from __future__ import absolute_import | ||||||
|  |  | ||||||
| from nilmdb.utils import datetime_tz | from nilmdb.utils import datetime_tz | ||||||
| import re | import re | ||||||
|  | import time | ||||||
|  |  | ||||||
| # Range | # Range | ||||||
| min_timestamp = (-2**63) | min_timestamp = (-2**63) | ||||||
| max_timestamp = (2**62 - 1) | max_timestamp = (2**63 - 1) | ||||||
|  |  | ||||||
| # Smallest representable step | # Smallest representable step | ||||||
| epsilon = 1 | epsilon = 1 | ||||||
| @@ -29,6 +32,10 @@ def timestamp_to_human(timestamp): | |||||||
|     """Convert a timestamp (integer microseconds since epoch) to a |     """Convert a timestamp (integer microseconds since epoch) to a | ||||||
|     human-readable string, using the local timezone for display |     human-readable string, using the local timezone for display | ||||||
|     (e.g. from the TZ env var).""" |     (e.g. from the TZ env var).""" | ||||||
|  |     if timestamp == min_timestamp: | ||||||
|  |         return "(minimum)" | ||||||
|  |     if timestamp == max_timestamp: | ||||||
|  |         return "(maximum)" | ||||||
|     dt = datetime_tz.datetime_tz.fromtimestamp(timestamp_to_unix(timestamp)) |     dt = datetime_tz.datetime_tz.fromtimestamp(timestamp_to_unix(timestamp)) | ||||||
|     return dt.strftime("%a, %d %b %Y %H:%M:%S.%f %z") |     return dt.strftime("%a, %d %b %Y %H:%M:%S.%f %z") | ||||||
|  |  | ||||||
| @@ -36,6 +43,7 @@ def unix_to_timestamp(unix): | |||||||
|     """Convert a Unix timestamp (floating point seconds since epoch) |     """Convert a Unix timestamp (floating point seconds since epoch) | ||||||
|     into a NILM timestamp (integer microseconds since epoch)""" |     into a NILM timestamp (integer microseconds since epoch)""" | ||||||
|     return int(round(unix * 1e6)) |     return int(round(unix * 1e6)) | ||||||
|  | seconds_to_timestamp = unix_to_timestamp | ||||||
|  |  | ||||||
| def timestamp_to_unix(timestamp): | def timestamp_to_unix(timestamp): | ||||||
|     """Convert a NILM timestamp (integer microseconds since epoch) |     """Convert a NILM timestamp (integer microseconds since epoch) | ||||||
| @@ -52,10 +60,23 @@ def rate_to_period(hz, cycles = 1): | |||||||
| def parse_time(toparse): | def parse_time(toparse): | ||||||
|     """ |     """ | ||||||
|     Parse a free-form time string and return a nilmdb timestamp |     Parse a free-form time string and return a nilmdb timestamp | ||||||
|     (integer seconds since epoch).  If the string doesn't contain a |     (integer microseconds since epoch).  If the string doesn't contain a | ||||||
|     timestamp, the current local timezone is assumed (e.g. from the TZ |     timestamp, the current local timezone is assumed (e.g. from the TZ | ||||||
|     env var). |     env var). | ||||||
|     """ |     """ | ||||||
|  |     if toparse == "min": | ||||||
|  |         return min_timestamp | ||||||
|  |     if toparse == "max": | ||||||
|  |         return max_timestamp | ||||||
|  |  | ||||||
|  |     # If it starts with @, treat it as a NILM timestamp | ||||||
|  |     # (integer microseconds since epoch) | ||||||
|  |     try: | ||||||
|  |         if toparse[0] == '@': | ||||||
|  |             return int(toparse[1:]) | ||||||
|  |     except (ValueError, KeyError, IndexError): | ||||||
|  |         pass | ||||||
|  |  | ||||||
|     # If string isn't "now" and doesn't contain at least 4 digits, |     # If string isn't "now" and doesn't contain at least 4 digits, | ||||||
|     # consider it invalid.  smartparse might otherwise accept |     # consider it invalid.  smartparse might otherwise accept | ||||||
|     # empty strings and strings with just separators. |     # empty strings and strings with just separators. | ||||||
| @@ -69,14 +90,6 @@ def parse_time(toparse): | |||||||
|     except (ValueError, OverflowError): |     except (ValueError, OverflowError): | ||||||
|         pass |         pass | ||||||
|  |  | ||||||
|     # If it starts with @, treat it as a NILM timestamp |  | ||||||
|     # (integer microseconds since epoch) |  | ||||||
|     try: |  | ||||||
|         if toparse[0] == '@': |  | ||||||
|             return int(toparse[1:]) |  | ||||||
|     except (ValueError, KeyError): |  | ||||||
|         pass |  | ||||||
|  |  | ||||||
|     # If it's parseable as a float, treat it as a Unix or NILM |     # If it's parseable as a float, treat it as a Unix or NILM | ||||||
|     # timestamp based on its range. |     # timestamp based on its range. | ||||||
|     try: |     try: | ||||||
| @@ -118,4 +131,4 @@ def parse_time(toparse): | |||||||
|  |  | ||||||
| def now(): | def now(): | ||||||
|     """Return current timestamp""" |     """Return current timestamp""" | ||||||
|     return unix_to_timestamp(datetime_tz.datetime_tz.utcnow().totimestamp()) |     return unix_to_timestamp(time.time()) | ||||||
|   | |||||||
							
								
								
									
										29
									
								
								nilmdb/utils/unicode.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										29
									
								
								nilmdb/utils/unicode.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,29 @@ | |||||||
|  | import sys | ||||||
|  |  | ||||||
|  | if sys.version_info[0] >= 3: # pragma: no cover (future Python3 compat) | ||||||
|  |     text_type = str | ||||||
|  | else: | ||||||
|  |     text_type = unicode | ||||||
|  |  | ||||||
|  | def encode(u): | ||||||
|  |     """Try to encode something from Unicode to a string using the | ||||||
|  |     default encoding.  If it fails, try encoding as UTF-8.""" | ||||||
|  |     if not isinstance(u, text_type): | ||||||
|  |         return u | ||||||
|  |     try: | ||||||
|  |         return u.encode() | ||||||
|  |     except UnicodeEncodeError: | ||||||
|  |         return u.encode("utf-8") | ||||||
|  |  | ||||||
|  | def decode(s): | ||||||
|  |     """Try to decode someting from string to Unicode using the | ||||||
|  |     default encoding.  If it fails, try decoding as UTF-8.""" | ||||||
|  |     if isinstance(s, text_type): | ||||||
|  |         return s | ||||||
|  |     try: | ||||||
|  |         return s.decode() | ||||||
|  |     except UnicodeDecodeError: | ||||||
|  |         try: | ||||||
|  |             return s.decode("utf-8") | ||||||
|  |         except UnicodeDecodeError: | ||||||
|  |             return s # best we can do | ||||||
							
								
								
									
										8
									
								
								setup.py
									
									
									
									
									
								
							
							
						
						
									
										8
									
								
								setup.py
									
									
									
									
									
								
							| @@ -39,11 +39,10 @@ versioneer.parentdir_prefix = 'nilmdb-' | |||||||
| # Hack to workaround logging/multiprocessing issue: | # Hack to workaround logging/multiprocessing issue: | ||||||
| # https://groups.google.com/d/msg/nose-users/fnJ-kAUbYHQ/_UsLN786ygcJ | # https://groups.google.com/d/msg/nose-users/fnJ-kAUbYHQ/_UsLN786ygcJ | ||||||
| try: import multiprocessing | try: import multiprocessing | ||||||
| except: pass | except Exception: pass | ||||||
|  |  | ||||||
| # Use Cython if it's new enough, otherwise use preexisting C files. | # Use Cython if it's new enough, otherwise use preexisting C files. | ||||||
| cython_modules = [ 'nilmdb.server.interval', | cython_modules = [ 'nilmdb.server.interval', | ||||||
|                    'nilmdb.server.layout', |  | ||||||
|                    'nilmdb.server.rbtree' ] |                    'nilmdb.server.rbtree' ] | ||||||
| try: | try: | ||||||
|     import Cython |     import Cython | ||||||
| @@ -108,17 +107,18 @@ setup(name='nilmdb', | |||||||
|       author_email = 'jim@jtan.com', |       author_email = 'jim@jtan.com', | ||||||
|       tests_require = [ 'nose', |       tests_require = [ 'nose', | ||||||
|                         'coverage', |                         'coverage', | ||||||
|  |                         'numpy', | ||||||
|                         ], |                         ], | ||||||
|       setup_requires = [ 'distribute', |       setup_requires = [ 'distribute', | ||||||
|                          ], |                          ], | ||||||
|       install_requires = [ 'decorator', |       install_requires = [ 'decorator', | ||||||
|                            'cherrypy >= 3.2', |                            'cherrypy >= 3.2', | ||||||
|                            'simplejson', |                            'simplejson', | ||||||
|                            'pycurl', |  | ||||||
|                            'python-dateutil', |                            'python-dateutil', | ||||||
|                            'pytz', |                            'pytz', | ||||||
|                            'psutil >= 0.3.0', |                            'psutil >= 0.3.0', | ||||||
|                            'requests >= 1.1.0, < 2.0.0', |                            'requests >= 1.1.0, < 2.0.0', | ||||||
|  |                            'progressbar >= 2.2', | ||||||
|                            ], |                            ], | ||||||
|       packages = [ 'nilmdb', |       packages = [ 'nilmdb', | ||||||
|                    'nilmdb.utils', |                    'nilmdb.utils', | ||||||
| @@ -127,11 +127,13 @@ setup(name='nilmdb', | |||||||
|                    'nilmdb.client', |                    'nilmdb.client', | ||||||
|                    'nilmdb.cmdline', |                    'nilmdb.cmdline', | ||||||
|                    'nilmdb.scripts', |                    'nilmdb.scripts', | ||||||
|  |                    'nilmdb.fsck', | ||||||
|                    ], |                    ], | ||||||
|       entry_points = { |       entry_points = { | ||||||
|           'console_scripts': [ |           'console_scripts': [ | ||||||
|               'nilmtool = nilmdb.scripts.nilmtool:main', |               'nilmtool = nilmdb.scripts.nilmtool:main', | ||||||
|               'nilmdb-server = nilmdb.scripts.nilmdb_server:main', |               'nilmdb-server = nilmdb.scripts.nilmdb_server:main', | ||||||
|  |               'nilmdb-fsck = nilmdb.scripts.nilmdb_fsck:main', | ||||||
|               ], |               ], | ||||||
|           }, |           }, | ||||||
|       ext_modules = ext_modules, |       ext_modules = ext_modules, | ||||||
|   | |||||||
							
								
								
									
										28
									
								
								tests/data/extract-8
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										28
									
								
								tests/data/extract-8
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,28 @@ | |||||||
|  | # interval-start 1332496919900000 | ||||||
|  | 1332496919900000 2.523050e+05 2.254020e+05 4.779410e+03 3.638030e+03 8.138070e+03 4.334460e+03 1.083780e+03 3.743730e+03 | ||||||
|  | 1332496919908333 2.551190e+05 2.237870e+05 5.965640e+03 2.076350e+03 9.468790e+03 3.693880e+03 1.247860e+03 3.393680e+03 | ||||||
|  | 1332496919916667 2.616370e+05 2.247980e+05 4.848970e+03 2.315620e+03 9.323300e+03 4.225460e+03 1.805780e+03 2.593050e+03 | ||||||
|  | 1332496919925000 2.606460e+05 2.251300e+05 3.061360e+03 3.951840e+03 7.662910e+03 5.341410e+03 1.986520e+03 2.276780e+03 | ||||||
|  | 1332496919933333 2.559710e+05 2.235030e+05 4.096030e+03 3.296970e+03 7.827080e+03 5.452120e+03 2.492520e+03 2.929450e+03 | ||||||
|  | 1332496919941667 2.579260e+05 2.217080e+05 5.472320e+03 1.555700e+03 8.495760e+03 4.491140e+03 2.379780e+03 3.741710e+03 | ||||||
|  | 1332496919950000 2.610180e+05 2.242350e+05 4.669770e+03 1.876190e+03 8.366680e+03 3.677510e+03 9.021690e+02 3.549040e+03 | ||||||
|  | 1332496919958333 2.569150e+05 2.274650e+05 2.785070e+03 3.751930e+03 7.440320e+03 3.964860e+03 -3.227860e+02 2.460890e+03 | ||||||
|  | 1332496919966667 2.509510e+05 2.262000e+05 3.772710e+03 3.131950e+03 8.159860e+03 4.539860e+03 7.375190e+02 2.126750e+03 | ||||||
|  | 1332496919975000 2.556710e+05 2.223720e+05 5.826200e+03 8.715560e+02 9.120240e+03 4.545110e+03 2.804310e+03 2.721000e+03 | ||||||
|  | 1332496919983333 2.649730e+05 2.214860e+05 5.839130e+03 4.659180e+02 8.628300e+03 3.934870e+03 2.972490e+03 3.773730e+03 | ||||||
|  | 1332496919991667 2.652170e+05 2.233920e+05 3.718770e+03 2.834970e+03 7.209900e+03 3.460260e+03 1.324930e+03 4.075960e+03 | ||||||
|  | # interval-end 1332496919991668 | ||||||
|  | # interval-start 1332496920000000 | ||||||
|  | 1332496920000000 2.564370e+05 2.244300e+05 4.011610e+03 3.475340e+03 7.495890e+03 3.388940e+03 2.613970e+02 3.731260e+03 | ||||||
|  | 1332496920008333 2.539630e+05 2.241670e+05 5.621070e+03 1.548010e+03 9.165170e+03 3.522930e+03 1.058930e+03 2.996960e+03 | ||||||
|  | 1332496920016667 2.585080e+05 2.249300e+05 6.011400e+03 8.188660e+02 9.039950e+03 4.482440e+03 2.490390e+03 2.679340e+03 | ||||||
|  | 1332496920025000 2.596270e+05 2.260220e+05 4.474500e+03 2.423020e+03 7.414190e+03 5.071970e+03 2.439380e+03 2.962960e+03 | ||||||
|  | 1332496920033333 2.551870e+05 2.246320e+05 4.738570e+03 3.398040e+03 7.395120e+03 4.726450e+03 1.839030e+03 3.393530e+03 | ||||||
|  | 1332496920041667 2.571020e+05 2.216230e+05 6.144130e+03 1.441090e+03 8.756480e+03 3.495320e+03 1.869940e+03 3.752530e+03 | ||||||
|  | 1332496920050000 2.636530e+05 2.217700e+05 6.221770e+03 7.389620e+02 9.547600e+03 2.666820e+03 1.462660e+03 3.332570e+03 | ||||||
|  | 1332496920058333 2.636130e+05 2.252560e+05 4.477120e+03 2.437450e+03 8.510210e+03 3.855630e+03 9.594420e+02 2.387180e+03 | ||||||
|  | 1332496920066667 2.553500e+05 2.262640e+05 4.283720e+03 3.923940e+03 7.912470e+03 5.466520e+03 1.284990e+03 2.093720e+03 | ||||||
|  | 1332496920075000 2.527270e+05 2.246090e+05 5.851930e+03 2.491980e+03 8.540630e+03 5.623050e+03 2.339780e+03 3.007140e+03 | ||||||
|  | 1332496920083333 2.584750e+05 2.235780e+05 5.924870e+03 1.394480e+03 8.779620e+03 4.544180e+03 2.132030e+03 3.849760e+03 | ||||||
|  | 1332496920091667 2.615630e+05 2.246090e+05 4.336140e+03 2.455750e+03 8.055380e+03 3.469110e+03 6.278730e+02 3.664200e+03 | ||||||
|  | # interval-end 1332496920100000 | ||||||
							
								
								
									
										8
									
								
								tests/data/timestamped
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										8
									
								
								tests/data/timestamped
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,8 @@ | |||||||
|  | -10000000000 2.61246e+05  2.22735e+05  4.60340e+03  2.58221e+03  8.42804e+03  3.41890e+03  9.57898e+02  4.00585e+03   | ||||||
|  | -100000000 2.61246e+05  2.22735e+05  4.60340e+03  2.58221e+03  8.42804e+03  3.41890e+03  9.57898e+02  4.00585e+03   | ||||||
|  | -100000 2.61246e+05  2.22735e+05  4.60340e+03  2.58221e+03  8.42804e+03  3.41890e+03  9.57898e+02  4.00585e+03   | ||||||
|  | -1000 2.61246e+05  2.22735e+05  4.60340e+03  2.58221e+03  8.42804e+03  3.41890e+03  9.57898e+02  4.00585e+03   | ||||||
|  | 1 2.61246e+05  2.22735e+05  4.60340e+03  2.58221e+03  8.42804e+03  3.41890e+03  9.57898e+02  4.00585e+03   | ||||||
|  | 1000 2.61246e+05  2.22735e+05  4.60340e+03  2.58221e+03  8.42804e+03  3.41890e+03  9.57898e+02  4.00585e+03   | ||||||
|  | 1000000 2.61246e+05  2.22735e+05  4.60340e+03  2.58221e+03  8.42804e+03  3.41890e+03  9.57898e+02  4.00585e+03   | ||||||
|  | 1000000000 2.61246e+05  2.22735e+05  4.60340e+03  2.58221e+03  8.42804e+03  3.41890e+03  9.57898e+02  4.00585e+03   | ||||||
| @@ -24,7 +24,7 @@ class JimOrderPlugin(nose.plugins.Plugin): | |||||||
|                     name, workingDir=loader.workingDir) |                     name, workingDir=loader.workingDir) | ||||||
|                 try: |                 try: | ||||||
|                     order = os.path.join(addr.filename, "test.order") |                     order = os.path.join(addr.filename, "test.order") | ||||||
|                 except: |                 except Exception: | ||||||
|                     order = None |                     order = None | ||||||
|                 if order and os.path.exists(order): |                 if order and os.path.exists(order): | ||||||
|                     files = [] |                     files = [] | ||||||
|   | |||||||
| @@ -4,16 +4,15 @@ test_lrucache.py | |||||||
| test_mustclose.py | test_mustclose.py | ||||||
|  |  | ||||||
| test_serializer.py | test_serializer.py | ||||||
| test_iteratorizer.py |  | ||||||
|  |  | ||||||
| test_timestamper.py | test_timestamper.py | ||||||
| test_layout.py |  | ||||||
| test_rbtree.py | test_rbtree.py | ||||||
| test_interval.py | test_interval.py | ||||||
|  |  | ||||||
| test_bulkdata.py | test_bulkdata.py | ||||||
| test_nilmdb.py | test_nilmdb.py | ||||||
| test_client.py | test_client.py | ||||||
|  | test_numpyclient.py | ||||||
| test_cmdline.py | test_cmdline.py | ||||||
|  |  | ||||||
| test_*.py | test_*.py | ||||||
|   | |||||||
| @@ -30,6 +30,11 @@ class TestBulkData(object): | |||||||
|         else: |         else: | ||||||
|             data = BulkData(db, file_size = size, files_per_dir = files) |             data = BulkData(db, file_size = size, files_per_dir = files) | ||||||
|  |  | ||||||
|  |         # Try opening it again (should result in locking error) | ||||||
|  |         with assert_raises(IOError) as e: | ||||||
|  |             data2 = BulkData(db) | ||||||
|  |         in_("already locked by another process", str(e.exception)) | ||||||
|  |  | ||||||
|         # create empty |         # create empty | ||||||
|         with assert_raises(ValueError): |         with assert_raises(ValueError): | ||||||
|             data.create("/foo", "uint16_8") |             data.create("/foo", "uint16_8") | ||||||
| @@ -64,9 +69,9 @@ class TestBulkData(object): | |||||||
|         raw = [] |         raw = [] | ||||||
|         for i in range(1000): |         for i in range(1000): | ||||||
|             raw.append("%d 1 2 3 4 5 6 7 8\n" % (10000 + i)) |             raw.append("%d 1 2 3 4 5 6 7 8\n" % (10000 + i)) | ||||||
|         node.append_string("".join(raw[0:1]), 0, 50000) |         node.append_data("".join(raw[0:1]), 0, 50000) | ||||||
|         node.append_string("".join(raw[1:100]), 0, 50000) |         node.append_data("".join(raw[1:100]), 0, 50000) | ||||||
|         node.append_string("".join(raw[100:]), 0, 50000) |         node.append_data("".join(raw[100:]), 0, 50000) | ||||||
|  |  | ||||||
|         misc_slices = [ 0, 100, slice(None), slice(0), slice(10), |         misc_slices = [ 0, 100, slice(None), slice(0), slice(10), | ||||||
|                         slice(5,10), slice(3,None), slice(3,-3), |                         slice(5,10), slice(3,None), slice(3,-3), | ||||||
| @@ -80,7 +85,7 @@ class TestBulkData(object): | |||||||
|         # Extract misc slices while appending, to make sure the |         # Extract misc slices while appending, to make sure the | ||||||
|         # data isn't being added in the middle of the file |         # data isn't being added in the middle of the file | ||||||
|         for s in [2, slice(1,5), 2, slice(1,5)]: |         for s in [2, slice(1,5), 2, slice(1,5)]: | ||||||
|             node.append_string("0 0 0 0 0 0 0 0 0\n", 0, 50000) |             node.append_data("0 0 0 0 0 0 0 0 0\n", 0, 50000) | ||||||
|             raw.append("0 0 0 0 0 0 0 0 0\n") |             raw.append("0 0 0 0 0 0 0 0 0\n") | ||||||
|             eq_(get_node_slice(s), raw[s]) |             eq_(get_node_slice(s), raw[s]) | ||||||
|  |  | ||||||
|   | |||||||
| @@ -23,6 +23,7 @@ import warnings | |||||||
| import resource | import resource | ||||||
| import time | import time | ||||||
| import re | import re | ||||||
|  | import struct | ||||||
|  |  | ||||||
| from testutil.helpers import * | from testutil.helpers import * | ||||||
|  |  | ||||||
| @@ -104,16 +105,19 @@ class TestClient(object): | |||||||
|                 client.http.post("/stream/list") |                 client.http.post("/stream/list") | ||||||
|         client = nilmdb.client.Client(url = testurl) |         client = nilmdb.client.Client(url = testurl) | ||||||
|  |  | ||||||
|         # Create three streams |         # Create four streams | ||||||
|         client.stream_create("/newton/prep", "float32_8") |         client.stream_create("/newton/prep", "float32_8") | ||||||
|         client.stream_create("/newton/raw", "uint16_6") |         client.stream_create("/newton/raw", "uint16_6") | ||||||
|         client.stream_create("/newton/zzz/rawnotch", "uint16_9") |         client.stream_create("/newton/zzz/rawnotch2", "uint16_9") | ||||||
|  |         client.stream_create("/newton/zzz/rawnotch11", "uint16_9") | ||||||
|  |  | ||||||
|         # Verify we got 3 streams |         # Verify we got 4 streams in the right order | ||||||
|         eq_(client.stream_list(), [ ["/newton/prep", "float32_8"], |         eq_(client.stream_list(), [ ["/newton/prep", "float32_8"], | ||||||
|                                     ["/newton/raw", "uint16_6"], |                                     ["/newton/raw", "uint16_6"], | ||||||
|                                     ["/newton/zzz/rawnotch", "uint16_9"] |                                     ["/newton/zzz/rawnotch2", "uint16_9"], | ||||||
|  |                                     ["/newton/zzz/rawnotch11", "uint16_9"] | ||||||
|                                     ]) |                                     ]) | ||||||
|  |  | ||||||
|         # Match just one type or one path |         # Match just one type or one path | ||||||
|         eq_(client.stream_list(layout="uint16_6"), |         eq_(client.stream_list(layout="uint16_6"), | ||||||
|             [ ["/newton/raw", "uint16_6"] ]) |             [ ["/newton/raw", "uint16_6"] ]) | ||||||
| @@ -238,6 +242,35 @@ class TestClient(object): | |||||||
|         in_("400 Bad Request", str(e.exception)) |         in_("400 Bad Request", str(e.exception)) | ||||||
|         in_("start must precede end", str(e.exception)) |         in_("start must precede end", str(e.exception)) | ||||||
|  |  | ||||||
|  |         # Invalid times in HTTP request | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             client.http.put("stream/insert", "", { "path": "/newton/prep", | ||||||
|  |                                                    "start": "asdf", "end": 0 }) | ||||||
|  |         in_("400 Bad Request", str(e.exception)) | ||||||
|  |         in_("invalid start", str(e.exception)) | ||||||
|  |  | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             client.http.put("stream/insert", "", { "path": "/newton/prep", | ||||||
|  |                                                    "start": 0, "end": "asdf" }) | ||||||
|  |         in_("400 Bad Request", str(e.exception)) | ||||||
|  |         in_("invalid end", str(e.exception)) | ||||||
|  |  | ||||||
|  |         # Good content type | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             client.http.put("stream/insert", "", | ||||||
|  |                             { "path": "xxxx", "start": 0, "end": 1, | ||||||
|  |                               "binary": 1 }, | ||||||
|  |                             binary = True) | ||||||
|  |         in_("No such stream", str(e.exception)) | ||||||
|  |  | ||||||
|  |         # Bad content type | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             client.http.put("stream/insert", "", | ||||||
|  |                             { "path": "xxxx", "start": 0, "end": 1, | ||||||
|  |                               "binary": 1 }, | ||||||
|  |                             binary = False) | ||||||
|  |         in_("Content type must be application/octet-stream", str(e.exception)) | ||||||
|  |  | ||||||
|         # Specify start/end (starts too late) |         # Specify start/end (starts too late) | ||||||
|         data = timestamper.TimestamperRate(testfile, start, 120) |         data = timestamper.TimestamperRate(testfile, start, 120) | ||||||
|         with assert_raises(ClientError) as e: |         with assert_raises(ClientError) as e: | ||||||
| @@ -293,6 +326,27 @@ class TestClient(object): | |||||||
|         # Test count |         # Test count | ||||||
|         eq_(client.stream_count("/newton/prep"), 14400) |         eq_(client.stream_count("/newton/prep"), 14400) | ||||||
|  |  | ||||||
|  |         # Test binary output | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             list(client.stream_extract("/newton/prep", | ||||||
|  |                                        markup = True, binary = True)) | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             list(client.stream_extract("/newton/prep", | ||||||
|  |                                        count = True, binary = True)) | ||||||
|  |         data = "".join(client.stream_extract("/newton/prep", binary = True)) | ||||||
|  |         # Quick check using struct | ||||||
|  |         unpacker = struct.Struct("<qffffffff") | ||||||
|  |         out = [] | ||||||
|  |         for i in range(14400): | ||||||
|  |             out.append(unpacker.unpack_from(data, i * unpacker.size)) | ||||||
|  |         eq_(out[0], (1332511200000000, 266568.0, 224029.0, 5161.39990234375, | ||||||
|  |                      2525.169921875, 8350.83984375, 3724.699951171875, | ||||||
|  |                      1355.3399658203125, 2039.0)) | ||||||
|  |  | ||||||
|  |         # Just get some coverage | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             client.http.post("/stream/remove", { "path": "/none" }) | ||||||
|  |  | ||||||
|         client.close() |         client.close() | ||||||
|  |  | ||||||
|     def test_client_06_generators(self): |     def test_client_06_generators(self): | ||||||
| @@ -311,11 +365,7 @@ class TestClient(object): | |||||||
|  |  | ||||||
|         # Trigger a curl error in generator |         # Trigger a curl error in generator | ||||||
|         with assert_raises(ServerError) as e: |         with assert_raises(ServerError) as e: | ||||||
|             client.http.get_gen("http://nosuchurl/").next() |             client.http.get_gen("http://nosuchurl.example.com./").next() | ||||||
|  |  | ||||||
|         # Trigger a curl error in generator |  | ||||||
|         with assert_raises(ServerError) as e: |  | ||||||
|             client.http.get_gen("http://nosuchurl/").next() |  | ||||||
|  |  | ||||||
|         # Check 404 for missing streams |         # Check 404 for missing streams | ||||||
|         for function in [ client.stream_intervals, client.stream_extract ]: |         for function in [ client.stream_intervals, client.stream_extract ]: | ||||||
| @@ -355,16 +405,38 @@ class TestClient(object): | |||||||
|                                  headers()) |                                  headers()) | ||||||
|  |  | ||||||
|         # Extract |         # Extract | ||||||
|         x = http.get("stream/extract", |         x = http.get("stream/extract", { "path": "/newton/prep", | ||||||
|                             { "path": "/newton/prep", |                                          "start": "123", "end": "124" }) | ||||||
|                               "start": "123", |  | ||||||
|                               "end": "124" }) |  | ||||||
|         if "transfer-encoding: chunked" not in headers(): |         if "transfer-encoding: chunked" not in headers(): | ||||||
|             warnings.warn("Non-chunked HTTP response for /stream/extract") |             warnings.warn("Non-chunked HTTP response for /stream/extract") | ||||||
|         if "content-type: text/plain;charset=utf-8" not in headers(): |         if "content-type: text/plain;charset=utf-8" not in headers(): | ||||||
|             raise AssertionError("/stream/extract is not text/plain:\n" + |             raise AssertionError("/stream/extract is not text/plain:\n" + | ||||||
|                                  headers()) |                                  headers()) | ||||||
|  |  | ||||||
|  |         x = http.get("stream/extract", { "path": "/newton/prep", | ||||||
|  |                                          "start": "123", "end": "124", | ||||||
|  |                                          "binary": "1" }) | ||||||
|  |         if "transfer-encoding: chunked" not in headers(): | ||||||
|  |             warnings.warn("Non-chunked HTTP response for /stream/extract") | ||||||
|  |         if "content-type: application/octet-stream" not in headers(): | ||||||
|  |             raise AssertionError("/stream/extract is not binary:\n" + | ||||||
|  |                                  headers()) | ||||||
|  |  | ||||||
|  |         # Make sure a binary of "0" is really off | ||||||
|  |         x = http.get("stream/extract", { "path": "/newton/prep", | ||||||
|  |                                          "start": "123", "end": "124", | ||||||
|  |                                          "binary": "0" }) | ||||||
|  |         if "content-type: application/octet-stream" in headers(): | ||||||
|  |                     raise AssertionError("/stream/extract is not text:\n" + | ||||||
|  |                                          headers()) | ||||||
|  |  | ||||||
|  |         # Invalid parameters | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             x = http.get("stream/extract", { "path": "/newton/prep", | ||||||
|  |                                              "start": "123", "end": "124", | ||||||
|  |                                              "binary": "asdfasfd" }) | ||||||
|  |         in_("can't parse parameter", str(e.exception)) | ||||||
|  |  | ||||||
|         client.close() |         client.close() | ||||||
|  |  | ||||||
|     def test_client_08_unicode(self): |     def test_client_08_unicode(self): | ||||||
| @@ -375,6 +447,7 @@ class TestClient(object): | |||||||
|  |  | ||||||
|             # Delete streams that exist |             # Delete streams that exist | ||||||
|             for stream in client.stream_list(): |             for stream in client.stream_list(): | ||||||
|  |                 client.stream_remove(stream[0]) | ||||||
|                 client.stream_destroy(stream[0]) |                 client.stream_destroy(stream[0]) | ||||||
|  |  | ||||||
|             # Database is empty |             # Database is empty | ||||||
| @@ -440,72 +513,80 @@ class TestClient(object): | |||||||
|             # override _max_data to trigger frequent server updates |             # override _max_data to trigger frequent server updates | ||||||
|             ctx._max_data = 15 |             ctx._max_data = 15 | ||||||
|  |  | ||||||
|             ctx.insert("100 1\n") |             ctx.insert("1000 1\n") | ||||||
|  |  | ||||||
|             ctx.insert("101 ") |             ctx.insert("1010 ") | ||||||
|             ctx.insert("1\n102 1") |             ctx.insert("1\n1020 1") | ||||||
|             ctx.insert("") |             ctx.insert("") | ||||||
|             ctx.insert("\n103 1\n") |             ctx.insert("\n1030 1\n") | ||||||
|  |  | ||||||
|             ctx.insert("104 1\n") |             ctx.insert("1040 1\n") | ||||||
|             ctx.insert("# hello\n") |             ctx.insert("# hello\n") | ||||||
|             ctx.insert("   # hello\n") |             ctx.insert("   # hello\n") | ||||||
|             ctx.insert("  105 1\n") |             ctx.insert("  1050 1\n") | ||||||
|             ctx.finalize() |             ctx.finalize() | ||||||
|  |  | ||||||
|             ctx.insert("107 1\n") |             ctx.insert("1070 1\n") | ||||||
|             ctx.update_end(108) |             ctx.update_end(1080) | ||||||
|             ctx.finalize() |             ctx.finalize() | ||||||
|             ctx.update_start(109) |             ctx.update_start(1090) | ||||||
|             ctx.insert("110 1\n") |             ctx.insert("1100 1\n") | ||||||
|             ctx.insert("111 1\n") |             ctx.insert("1110 1\n") | ||||||
|             ctx.insert("112 1\n") |             ctx.send() | ||||||
|             ctx.insert("113 1\n") |             ctx.insert("1120 1\n") | ||||||
|             ctx.insert("114 1\n") |             ctx.insert("1130 1\n") | ||||||
|             ctx.update_end(116) |             ctx.insert("1140 1\n") | ||||||
|             ctx.insert("115 1\n") |             ctx.update_end(1160) | ||||||
|             ctx.update_end(117) |             ctx.insert("1150 1\n") | ||||||
|             ctx.insert("116 1\n") |             ctx.update_end(1170) | ||||||
|             ctx.update_end(118) |             ctx.insert("1160 1\n") | ||||||
|             ctx.insert("117 1" + |             ctx.update_end(1180) | ||||||
|  |             ctx.insert("1170 1" + | ||||||
|                        " # this is super long" * 100 + |                        " # this is super long" * 100 + | ||||||
|                        "\n") |                        "\n") | ||||||
|             ctx.finalize() |             ctx.finalize() | ||||||
|             ctx.insert("# this is super long" * 100) |             ctx.insert("# this is super long" * 100) | ||||||
|  |  | ||||||
|         with assert_raises(ClientError): |         with assert_raises(ClientError): | ||||||
|             with client.stream_insert_context("/context/test", 100, 200) as ctx: |             with client.stream_insert_context("/context/test", | ||||||
|                 ctx.insert("118 1\n") |                                               1000, 2000) as ctx: | ||||||
|  |                 ctx.insert("1180 1\n") | ||||||
|  |  | ||||||
|         with assert_raises(ClientError): |         with assert_raises(ClientError): | ||||||
|             with client.stream_insert_context("/context/test", 200, 300) as ctx: |             with client.stream_insert_context("/context/test", | ||||||
|                 ctx.insert("118 1\n") |                                               2000, 3000) as ctx: | ||||||
|  |                 ctx.insert("1180 1\n") | ||||||
|  |  | ||||||
|         with assert_raises(ClientError): |         with assert_raises(ClientError): | ||||||
|             with client.stream_insert_context("/context/test") as ctx: |             with client.stream_insert_context("/context/test") as ctx: | ||||||
|                 ctx.insert("bogus data\n") |                 ctx.insert("bogus data\n") | ||||||
|  |  | ||||||
|         with client.stream_insert_context("/context/test", 200, 300) as ctx: |         with client.stream_insert_context("/context/test", 2000, 3000) as ctx: | ||||||
|             # make sure our override wasn't permanent |             # make sure our override wasn't permanent | ||||||
|             ne_(ctx._max_data, 15) |             ne_(ctx._max_data, 15) | ||||||
|             ctx.insert("225 1\n") |             ctx.insert("2250 1\n") | ||||||
|             ctx.finalize() |             ctx.finalize() | ||||||
|  |  | ||||||
|         with assert_raises(ClientError): |         with assert_raises(ClientError): | ||||||
|             with client.stream_insert_context("/context/test", 300, 400) as ctx: |             with client.stream_insert_context("/context/test", | ||||||
|                 ctx.insert("301 1\n") |                                               3000, 4000) as ctx: | ||||||
|                 ctx.insert("302 2\n") |                 ctx.insert("3010 1\n") | ||||||
|                 ctx.insert("303 3\n") |                 ctx.insert("3020 2\n") | ||||||
|                 ctx.insert("304 4\n") |                 ctx.insert("3030 3\n") | ||||||
|                 ctx.insert("304 4\n") # non-monotonic after a few lines |                 ctx.insert("3040 4\n") | ||||||
|  |                 ctx.insert("3040 4\n") # non-monotonic after a few lines | ||||||
|                 ctx.finalize() |                 ctx.finalize() | ||||||
|  |  | ||||||
|         eq_(list(client.stream_intervals("/context/test")), |         eq_(list(client.stream_intervals("/context/test")), | ||||||
|             [ [ 100, 106 ], |             [ [ 1000, 1051 ], | ||||||
|               [ 107, 108 ], |               [ 1070, 1080 ], | ||||||
|               [ 109, 118 ], |               [ 1090, 1180 ], | ||||||
|               [ 200, 300 ] ]) |               [ 2000, 3000 ] ]) | ||||||
|  |  | ||||||
|  |         # destroy stream (try without removing data first) | ||||||
|  |         with assert_raises(ClientError): | ||||||
|  |             client.stream_destroy("/context/test") | ||||||
|  |         client.stream_remove("/context/test") | ||||||
|         client.stream_destroy("/context/test") |         client.stream_destroy("/context/test") | ||||||
|         client.close() |         client.close() | ||||||
|  |  | ||||||
| @@ -559,8 +640,12 @@ class TestClient(object): | |||||||
|         with client.stream_insert_context("/empty/test", end = 950): |         with client.stream_insert_context("/empty/test", end = 950): | ||||||
|             pass |             pass | ||||||
|  |  | ||||||
|  |         # Equal start and end is OK as long as there's no data | ||||||
|  |         with client.stream_insert_context("/empty/test", start=9, end=9): | ||||||
|  |             pass | ||||||
|  |  | ||||||
|         # Try various things that might cause problems |         # Try various things that might cause problems | ||||||
|         with client.stream_insert_context("/empty/test", 1000, 1050): |         with client.stream_insert_context("/empty/test", 1000, 1050) as ctx: | ||||||
|             ctx.finalize() # inserts [1000, 1050] |             ctx.finalize() # inserts [1000, 1050] | ||||||
|             ctx.finalize() # nothing |             ctx.finalize() # nothing | ||||||
|             ctx.finalize() # nothing |             ctx.finalize() # nothing | ||||||
| @@ -600,6 +685,7 @@ class TestClient(object): | |||||||
|                      ]) |                      ]) | ||||||
|  |  | ||||||
|         # Clean up |         # Clean up | ||||||
|  |         client.stream_remove("/empty/test") | ||||||
|         client.stream_destroy("/empty/test") |         client.stream_destroy("/empty/test") | ||||||
|         client.close() |         client.close() | ||||||
|  |  | ||||||
| @@ -613,7 +699,7 @@ class TestClient(object): | |||||||
|                     poolmanager = c.http._last_response.connection.poolmanager |                     poolmanager = c.http._last_response.connection.poolmanager | ||||||
|                     pool = poolmanager.pools[('http','localhost',32180)] |                     pool = poolmanager.pools[('http','localhost',32180)] | ||||||
|                     return (pool.num_connections, pool.num_requests) |                     return (pool.num_connections, pool.num_requests) | ||||||
|                 except: |                 except Exception: | ||||||
|                     raise SkipTest("can't get connection info") |                     raise SkipTest("can't get connection info") | ||||||
|  |  | ||||||
|             # First request makes a connection |             # First request makes a connection | ||||||
| @@ -635,8 +721,9 @@ class TestClient(object): | |||||||
|             eq_(connections(), (1, 5)) |             eq_(connections(), (1, 5)) | ||||||
|  |  | ||||||
|             # Clean up |             # Clean up | ||||||
|  |             c.stream_remove("/persist/test") | ||||||
|             c.stream_destroy("/persist/test") |             c.stream_destroy("/persist/test") | ||||||
|             eq_(connections(), (1, 6)) |             eq_(connections(), (1, 7)) | ||||||
|  |  | ||||||
|     def test_client_13_timestamp_rounding(self): |     def test_client_13_timestamp_rounding(self): | ||||||
|         # Test potentially bad timestamps (due to floating point |         # Test potentially bad timestamps (due to floating point | ||||||
| @@ -661,5 +748,6 @@ class TestClient(object): | |||||||
|                 # Server will round this and give an error on finalize() |                 # Server will round this and give an error on finalize() | ||||||
|                 ctx.insert("299999999.99 1\n") |                 ctx.insert("299999999.99 1\n") | ||||||
|  |  | ||||||
|  |         client.stream_remove("/rounding/test") | ||||||
|         client.stream_destroy("/rounding/test") |         client.stream_destroy("/rounding/test") | ||||||
|         client.close() |         client.close() | ||||||
|   | |||||||
| @@ -21,12 +21,13 @@ from testutil.helpers import * | |||||||
|  |  | ||||||
| testdb = "tests/cmdline-testdb" | testdb = "tests/cmdline-testdb" | ||||||
|  |  | ||||||
| def server_start(max_results = None, bulkdata_args = {}): | def server_start(max_results = None, max_removals = None, bulkdata_args = {}): | ||||||
|     global test_server, test_db |     global test_server, test_db | ||||||
|     # Start web app on a custom port |     # Start web app on a custom port | ||||||
|     test_db = nilmdb.utils.serializer_proxy(nilmdb.server.NilmDB)( |     test_db = nilmdb.utils.serializer_proxy(nilmdb.server.NilmDB)( | ||||||
|         testdb, |         testdb, | ||||||
|         max_results = max_results, |         max_results = max_results, | ||||||
|  |         max_removals = max_removals, | ||||||
|         bulkdata_args = bulkdata_args) |         bulkdata_args = bulkdata_args) | ||||||
|     test_server = nilmdb.server.Server(test_db, host = "127.0.0.1", |     test_server = nilmdb.server.Server(test_db, host = "127.0.0.1", | ||||||
|                                        port = 32180, stoppable = False, |                                        port = 32180, stoppable = False, | ||||||
| @@ -58,8 +59,7 @@ class TestCmdline(object): | |||||||
|  |  | ||||||
|     def run(self, arg_string, infile=None, outfile=None): |     def run(self, arg_string, infile=None, outfile=None): | ||||||
|         """Run a cmdline client with the specified argument string, |         """Run a cmdline client with the specified argument string, | ||||||
|         passing the given input.  Returns a tuple with the output and |         passing the given input.  Save the output and exit code.""" | ||||||
|         exit code""" |  | ||||||
|         # printf("TZ=UTC ./nilmtool.py %s\n", arg_string) |         # printf("TZ=UTC ./nilmtool.py %s\n", arg_string) | ||||||
|         os.environ['NILMDB_URL'] = "http://localhost:32180/" |         os.environ['NILMDB_URL'] = "http://localhost:32180/" | ||||||
|         class stdio_wrapper: |         class stdio_wrapper: | ||||||
| @@ -87,7 +87,7 @@ class TestCmdline(object): | |||||||
|                 sys.exit(0) |                 sys.exit(0) | ||||||
|             except SystemExit as e: |             except SystemExit as e: | ||||||
|                 exitcode = e.code |                 exitcode = e.code | ||||||
|         captured = outfile.getvalue() |         captured = nilmdb.utils.unicode.decode(outfile.getvalue()) | ||||||
|         self.captured = captured |         self.captured = captured | ||||||
|         self.exitcode = exitcode |         self.exitcode = exitcode | ||||||
|  |  | ||||||
| @@ -159,6 +159,12 @@ class TestCmdline(object): | |||||||
|         self.ok("--help") |         self.ok("--help") | ||||||
|         self.contain("usage:") |         self.contain("usage:") | ||||||
|  |  | ||||||
|  |         # help | ||||||
|  |         self.ok("--version") | ||||||
|  |         ver = self.captured | ||||||
|  |         self.ok("list --version") | ||||||
|  |         eq_(self.captured, ver) | ||||||
|  |  | ||||||
|         # fail for no args |         # fail for no args | ||||||
|         self.fail("") |         self.fail("") | ||||||
|  |  | ||||||
| @@ -233,6 +239,8 @@ class TestCmdline(object): | |||||||
|         eq_(parse_time("1333648800.0"), test) |         eq_(parse_time("1333648800.0"), test) | ||||||
|         eq_(parse_time("1333648800000000"), test) |         eq_(parse_time("1333648800000000"), test) | ||||||
|         eq_(parse_time("@1333648800000000"), test) |         eq_(parse_time("@1333648800000000"), test) | ||||||
|  |         eq_(parse_time("min"), nilmdb.utils.time.min_timestamp) | ||||||
|  |         eq_(parse_time("max"), nilmdb.utils.time.max_timestamp) | ||||||
|         with assert_raises(ValueError): |         with assert_raises(ValueError): | ||||||
|             parse_time("@hashtag12345") |             parse_time("@hashtag12345") | ||||||
|  |  | ||||||
| @@ -242,8 +250,10 @@ class TestCmdline(object): | |||||||
|         self.contain("Client version: " + nilmdb.__version__) |         self.contain("Client version: " + nilmdb.__version__) | ||||||
|         self.contain("Server version: " + test_server.version) |         self.contain("Server version: " + test_server.version) | ||||||
|         self.contain("Server database path") |         self.contain("Server database path") | ||||||
|         self.contain("Server database size") |         self.contain("Server disk space used by NilmDB") | ||||||
|         self.contain("Server database free space") |         self.contain("Server disk space used by other") | ||||||
|  |         self.contain("Server disk space reserved") | ||||||
|  |         self.contain("Server disk space free") | ||||||
|  |  | ||||||
|     def test_04_createlist(self): |     def test_04_createlist(self): | ||||||
|         # Basic stream tests, like those in test_client. |         # Basic stream tests, like those in test_client. | ||||||
| @@ -297,38 +307,19 @@ class TestCmdline(object): | |||||||
|  |  | ||||||
|         # Verify we got those 3 streams and they're returned in |         # Verify we got those 3 streams and they're returned in | ||||||
|         # alphabetical order. |         # alphabetical order. | ||||||
|         self.ok("list") |         self.ok("list -l") | ||||||
|         self.match("/newton/prep float32_8\n" |         self.match("/newton/prep float32_8\n" | ||||||
|                    "/newton/raw uint16_6\n" |                    "/newton/raw uint16_6\n" | ||||||
|                    "/newton/zzz/rawnotch uint16_9\n") |                    "/newton/zzz/rawnotch uint16_9\n") | ||||||
|  |  | ||||||
|         # Match just one type or one path.  Also check |         # Match just one type or one path.  Also check | ||||||
|         # that --path is optional |         # that --path is optional | ||||||
|         self.ok("list --path /newton/raw") |         self.ok("list --layout /newton/raw") | ||||||
|         self.match("/newton/raw uint16_6\n") |  | ||||||
|  |  | ||||||
|         self.ok("list /newton/raw") |  | ||||||
|         self.match("/newton/raw uint16_6\n") |  | ||||||
|  |  | ||||||
|         self.fail("list -p /newton/raw /newton/raw") |  | ||||||
|         self.contain("too many paths") |  | ||||||
|  |  | ||||||
|         self.ok("list --layout uint16_6") |  | ||||||
|         self.match("/newton/raw uint16_6\n") |         self.match("/newton/raw uint16_6\n") | ||||||
|  |  | ||||||
|         # Wildcard matches |         # Wildcard matches | ||||||
|         self.ok("list --layout uint16*") |         self.ok("list *zzz*") | ||||||
|         self.match("/newton/raw uint16_6\n" |         self.match("/newton/zzz/rawnotch\n") | ||||||
|                    "/newton/zzz/rawnotch uint16_9\n") |  | ||||||
|  |  | ||||||
|         self.ok("list --path *zzz* --layout uint16*") |  | ||||||
|         self.match("/newton/zzz/rawnotch uint16_9\n") |  | ||||||
|  |  | ||||||
|         self.ok("list *zzz* --layout uint16*") |  | ||||||
|         self.match("/newton/zzz/rawnotch uint16_9\n") |  | ||||||
|  |  | ||||||
|         self.ok("list --path *zzz* --layout float32*") |  | ||||||
|         self.match("") |  | ||||||
|  |  | ||||||
|         # reversed range |         # reversed range | ||||||
|         self.fail("list /newton/prep --start 2020-01-01 --end 2000-01-01") |         self.fail("list /newton/prep --start 2020-01-01 --end 2000-01-01") | ||||||
| @@ -366,6 +357,8 @@ class TestCmdline(object): | |||||||
|         self.contain("No stream at path") |         self.contain("No stream at path") | ||||||
|         self.fail("metadata /newton/nosuchstream --set foo=bar") |         self.fail("metadata /newton/nosuchstream --set foo=bar") | ||||||
|         self.contain("No stream at path") |         self.contain("No stream at path") | ||||||
|  |         self.fail("metadata /newton/nosuchstream --delete") | ||||||
|  |         self.contain("No stream at path") | ||||||
|  |  | ||||||
|         self.ok("metadata /newton/prep") |         self.ok("metadata /newton/prep") | ||||||
|         self.match("description=The Data\nv_scale=1.234\n") |         self.match("description=The Data\nv_scale=1.234\n") | ||||||
| @@ -391,6 +384,19 @@ class TestCmdline(object): | |||||||
|         self.fail("metadata /newton/nosuchpath") |         self.fail("metadata /newton/nosuchpath") | ||||||
|         self.contain("No stream at path /newton/nosuchpath") |         self.contain("No stream at path /newton/nosuchpath") | ||||||
|  |  | ||||||
|  |         self.ok("metadata /newton/prep --delete") | ||||||
|  |         self.ok("metadata /newton/prep --get") | ||||||
|  |         self.match("") | ||||||
|  |         self.ok("metadata /newton/prep --set " | ||||||
|  |                 "'description=The Data' " | ||||||
|  |                 "v_scale=1.234") | ||||||
|  |         self.ok("metadata /newton/prep --delete v_scale") | ||||||
|  |         self.ok("metadata /newton/prep --get") | ||||||
|  |         self.match("description=The Data\n") | ||||||
|  |         self.ok("metadata /newton/prep --set description=") | ||||||
|  |         self.ok("metadata /newton/prep --get") | ||||||
|  |         self.match("") | ||||||
|  |  | ||||||
|     def test_06_insert(self): |     def test_06_insert(self): | ||||||
|         self.ok("insert --help") |         self.ok("insert --help") | ||||||
|  |  | ||||||
| @@ -474,33 +480,40 @@ class TestCmdline(object): | |||||||
|         # bad start time |         # bad start time | ||||||
|         self.fail("insert -t -r 120 --start 'whatever' /newton/prep /dev/null") |         self.fail("insert -t -r 120 --start 'whatever' /newton/prep /dev/null") | ||||||
|  |  | ||||||
|  |         # Test negative times | ||||||
|  |         self.ok("insert --start @-10000000000 --end @1000000001 /newton/prep" | ||||||
|  |                 " tests/data/timestamped") | ||||||
|  |         self.ok("extract -c /newton/prep --start min --end @1000000001") | ||||||
|  |         self.match("8\n") | ||||||
|  |         self.ok("remove /newton/prep --start min --end @1000000001") | ||||||
|  |  | ||||||
|     def test_07_detail_extended(self): |     def test_07_detail_extended(self): | ||||||
|         # Just count the number of lines, it's probably fine |         # Just count the number of lines, it's probably fine | ||||||
|         self.ok("list --detail") |         self.ok("list --detail") | ||||||
|         lines_(self.captured, 8) |         lines_(self.captured, 8) | ||||||
|  |  | ||||||
|         self.ok("list --detail --path *prep") |         self.ok("list --detail *prep") | ||||||
|         lines_(self.captured, 4) |         lines_(self.captured, 4) | ||||||
|  |  | ||||||
|         self.ok("list --detail --path *prep --start='23 Mar 2012 10:02'") |         self.ok("list --detail *prep --start='23 Mar 2012 10:02'") | ||||||
|         lines_(self.captured, 3) |         lines_(self.captured, 3) | ||||||
|  |  | ||||||
|         self.ok("list --detail --path *prep --start='23 Mar 2012 10:05'") |         self.ok("list --detail *prep --start='23 Mar 2012 10:05'") | ||||||
|         lines_(self.captured, 2) |         lines_(self.captured, 2) | ||||||
|  |  | ||||||
|         self.ok("list --detail --path *prep --start='23 Mar 2012 10:05:15'") |         self.ok("list --detail *prep --start='23 Mar 2012 10:05:15'") | ||||||
|         lines_(self.captured, 2) |         lines_(self.captured, 2) | ||||||
|         self.contain("10:05:15.000") |         self.contain("10:05:15.000") | ||||||
|  |  | ||||||
|         self.ok("list --detail --path *prep --start='23 Mar 2012 10:05:15.50'") |         self.ok("list --detail *prep --start='23 Mar 2012 10:05:15.50'") | ||||||
|         lines_(self.captured, 2) |         lines_(self.captured, 2) | ||||||
|         self.contain("10:05:15.500") |         self.contain("10:05:15.500") | ||||||
|  |  | ||||||
|         self.ok("list --detail --path *prep --start='23 Mar 2012 19:05:15.50'") |         self.ok("list --detail *prep --start='23 Mar 2012 19:05:15.50'") | ||||||
|         lines_(self.captured, 2) |         lines_(self.captured, 2) | ||||||
|         self.contain("no intervals") |         self.contain("no intervals") | ||||||
|  |  | ||||||
|         self.ok("list --detail --path *prep --start='23 Mar 2012 10:05:15.50'" |         self.ok("list --detail *prep --start='23 Mar 2012 10:05:15.50'" | ||||||
|                 + " --end='23 Mar 2012 10:05:15.51'") |                 + " --end='23 Mar 2012 10:05:15.51'") | ||||||
|         lines_(self.captured, 2) |         lines_(self.captured, 2) | ||||||
|         self.contain("10:05:15.500") |         self.contain("10:05:15.500") | ||||||
| @@ -509,15 +522,15 @@ class TestCmdline(object): | |||||||
|         lines_(self.captured, 8) |         lines_(self.captured, 8) | ||||||
|  |  | ||||||
|         # Verify the "raw timestamp" output |         # Verify the "raw timestamp" output | ||||||
|         self.ok("list --detail --path *prep --timestamp-raw " |         self.ok("list --detail *prep --timestamp-raw " | ||||||
|                 "--start='23 Mar 2012 10:05:15.50'") |                 "--start='23 Mar 2012 10:05:15.50'") | ||||||
|         lines_(self.captured, 2) |         lines_(self.captured, 2) | ||||||
|         self.contain("[ 1332497115500000 -> 1332497160000000 ]") |         self.contain("[ 1332497115500000 -> 1332497160000000 ]") | ||||||
|  |  | ||||||
|         # bad time |         # bad time | ||||||
|         self.fail("list --detail --path *prep -T --start='9332497115.612'") |         self.fail("list --detail *prep -T --start='9332497115.612'") | ||||||
|         # good time |         # good time | ||||||
|         self.ok("list --detail --path *prep -T --start='1332497115.612'") |         self.ok("list --detail *prep -T --start='1332497115.612'") | ||||||
|         lines_(self.captured, 2) |         lines_(self.captured, 2) | ||||||
|         self.contain("[ 1332497115612000 -> 1332497160000000 ]") |         self.contain("[ 1332497115612000 -> 1332497160000000 ]") | ||||||
|  |  | ||||||
| @@ -593,13 +606,28 @@ class TestCmdline(object): | |||||||
|         test(6, "10:00:30", "10:00:31", extra="-b") |         test(6, "10:00:30", "10:00:31", extra="-b") | ||||||
|         test(7, "10:00:30", "10:00:30.999", extra="-a -T") |         test(7, "10:00:30", "10:00:30.999", extra="-a -T") | ||||||
|         test(7, "10:00:30", "10:00:30.999", extra="-a --timestamp-raw") |         test(7, "10:00:30", "10:00:30.999", extra="-a --timestamp-raw") | ||||||
|  |         test(8, "10:01:59.9", "10:02:00.1", extra="--markup") | ||||||
|  |         test(8, "10:01:59.9", "10:02:00.1", extra="-m") | ||||||
|  |  | ||||||
|         # all data put in by tests |         # all data put in by tests | ||||||
|         self.ok("extract -a /newton/prep --start 2000-01-01 --end 2020-01-01") |         self.ok("extract -a /newton/prep --start min --end max") | ||||||
|         lines_(self.captured, 43204) |         lines_(self.captured, 43204) | ||||||
|         self.ok("extract -c /newton/prep --start 2000-01-01 --end 2020-01-01") |         self.ok("extract -c /newton/prep --start 2000-01-01 --end 2020-01-01") | ||||||
|         self.match("43200\n") |         self.match("43200\n") | ||||||
|  |  | ||||||
|  |         # test binary mode | ||||||
|  |         self.fail("extract -c -B /newton/prep -s min -e max") | ||||||
|  |         self.contain("binary cannot be combined") | ||||||
|  |         self.fail("extract -m -B /newton/prep -s min -e max") | ||||||
|  |         self.contain("binary cannot be combined") | ||||||
|  |         self.ok("extract -B /newton/prep -s min -e max") | ||||||
|  |         eq_(len(self.captured), 43200 * (8 + 8*4)) | ||||||
|  |  | ||||||
|  |         # markup for 3 intervals, plus extra markup lines whenever we had | ||||||
|  |         # a "restart" from the nilmdb.stream_extract function | ||||||
|  |         self.ok("extract -m /newton/prep --start 2000-01-01 --end 2020-01-01") | ||||||
|  |         lines_(self.captured, 43210) | ||||||
|  |  | ||||||
|     def test_09_truncated(self): |     def test_09_truncated(self): | ||||||
|         # Test truncated responses by overriding the nilmdb max_results |         # Test truncated responses by overriding the nilmdb max_results | ||||||
|         server_stop() |         server_stop() | ||||||
| @@ -614,7 +642,7 @@ class TestCmdline(object): | |||||||
|  |  | ||||||
|         # Try nonexistent stream |         # Try nonexistent stream | ||||||
|         self.fail("remove /no/such/foo --start 2000-01-01 --end 2020-01-01") |         self.fail("remove /no/such/foo --start 2000-01-01 --end 2020-01-01") | ||||||
|         self.contain("No stream at path") |         self.contain("no stream matched path") | ||||||
|  |  | ||||||
|         # empty or backward ranges return errors |         # empty or backward ranges return errors | ||||||
|         self.fail("remove /newton/prep --start 2020-01-01 --end 2000-01-01") |         self.fail("remove /newton/prep --start 2020-01-01 --end 2000-01-01") | ||||||
| @@ -642,9 +670,14 @@ class TestCmdline(object): | |||||||
|                 "--start '23 Mar 2022 20:00:30' " + |                 "--start '23 Mar 2022 20:00:30' " + | ||||||
|                 "--end '23 Mar 2022 20:00:31'") |                 "--end '23 Mar 2022 20:00:31'") | ||||||
|         self.match("0\n") |         self.match("0\n") | ||||||
|  |         self.ok("remove -c /newton/prep /newton/pre* " + | ||||||
|  |                 "--start '23 Mar 2022 20:00:30' " + | ||||||
|  |                 "--end '23 Mar 2022 20:00:31'") | ||||||
|  |         self.match("Removing from /newton/prep\n0\n" + | ||||||
|  |                    "Removing from /newton/prep\n0\n") | ||||||
|  |  | ||||||
|         # Make sure we have the data we expect |         # Make sure we have the data we expect | ||||||
|         self.ok("list --detail /newton/prep") |         self.ok("list -l --detail /newton/prep") | ||||||
|         self.match("/newton/prep float32_8\n" + |         self.match("/newton/prep float32_8\n" + | ||||||
|                    "  [ Fri, 23 Mar 2012 10:00:00.000000 +0000" |                    "  [ Fri, 23 Mar 2012 10:00:00.000000 +0000" | ||||||
|                    " -> Fri, 23 Mar 2012 10:01:59.991668 +0000 ]\n" |                    " -> Fri, 23 Mar 2012 10:01:59.991668 +0000 ]\n" | ||||||
| @@ -679,7 +712,7 @@ class TestCmdline(object): | |||||||
|         self.match("24000\n") |         self.match("24000\n") | ||||||
|  |  | ||||||
|         # See the missing chunks in list output |         # See the missing chunks in list output | ||||||
|         self.ok("list --detail /newton/prep") |         self.ok("list --layout --detail /newton/prep") | ||||||
|         self.match("/newton/prep float32_8\n" + |         self.match("/newton/prep float32_8\n" + | ||||||
|                    "  [ Fri, 23 Mar 2012 10:00:00.000000 +0000" |                    "  [ Fri, 23 Mar 2012 10:00:00.000000 +0000" | ||||||
|                    " -> Fri, 23 Mar 2012 10:00:05.000000 +0000 ]\n" |                    " -> Fri, 23 Mar 2012 10:00:05.000000 +0000 ]\n" | ||||||
| @@ -693,17 +726,15 @@ class TestCmdline(object): | |||||||
|         # Remove all data, verify it's missing |         # Remove all data, verify it's missing | ||||||
|         self.ok("remove /newton/prep --start 2000-01-01 --end 2020-01-01") |         self.ok("remove /newton/prep --start 2000-01-01 --end 2020-01-01") | ||||||
|         self.match("")  # no count requested this time |         self.match("")  # no count requested this time | ||||||
|         self.ok("list --detail /newton/prep") |         self.ok("list -l --detail /newton/prep") | ||||||
|         self.match("/newton/prep float32_8\n" + |         self.match("/newton/prep float32_8\n" + | ||||||
|                    "  (no intervals)\n") |                    "  (no intervals)\n") | ||||||
|  |  | ||||||
|         # Reinsert some data, to verify that no overlaps with deleted |         # Reinsert some data, to verify that no overlaps with deleted | ||||||
|         # data are reported |         # data are reported | ||||||
|         os.environ['TZ'] = "UTC" |         for minute in ["0", "2"]: | ||||||
|         self.ok("insert --timestamp -f --rate 120 /newton/prep " |             self.ok("insert --timestamp -f --rate 120 /newton/prep" | ||||||
|                 "tests/data/prep-20120323T1000") |                     " tests/data/prep-20120323T100" + minute) | ||||||
|         self.ok("insert -t --filename --rate 120 /newton/prep " |  | ||||||
|                 "tests/data/prep-20120323T1002") |  | ||||||
|  |  | ||||||
|     def test_11_destroy(self): |     def test_11_destroy(self): | ||||||
|         # Delete records |         # Delete records | ||||||
| @@ -713,13 +744,16 @@ class TestCmdline(object): | |||||||
|         self.contain("too few arguments") |         self.contain("too few arguments") | ||||||
|  |  | ||||||
|         self.fail("destroy /no/such/stream") |         self.fail("destroy /no/such/stream") | ||||||
|         self.contain("No stream at path") |         self.contain("no stream matched path") | ||||||
|  |  | ||||||
|  |         self.fail("destroy -R /no/such/stream") | ||||||
|  |         self.contain("no stream matched path") | ||||||
|  |  | ||||||
|         self.fail("destroy asdfasdf") |         self.fail("destroy asdfasdf") | ||||||
|         self.contain("No stream at path") |         self.contain("no stream matched path") | ||||||
|  |  | ||||||
|         # From previous tests, we have: |         # From previous tests, we have: | ||||||
|         self.ok("list") |         self.ok("list -l") | ||||||
|         self.match("/newton/prep float32_8\n" |         self.match("/newton/prep float32_8\n" | ||||||
|                    "/newton/raw uint16_6\n" |                    "/newton/raw uint16_6\n" | ||||||
|                    "/newton/zzz/rawnotch uint16_9\n") |                    "/newton/zzz/rawnotch uint16_9\n") | ||||||
| @@ -728,19 +762,26 @@ class TestCmdline(object): | |||||||
|         self.ok("list --detail") |         self.ok("list --detail") | ||||||
|         lines_(self.captured, 7) |         lines_(self.captured, 7) | ||||||
|  |  | ||||||
|         # Delete some |         # Fail to destroy because intervals still present | ||||||
|         self.ok("destroy /newton/prep") |         self.fail("destroy /newton/prep") | ||||||
|         self.ok("list") |         self.contain("all intervals must be removed") | ||||||
|  |         self.ok("list --detail") | ||||||
|  |         lines_(self.captured, 7) | ||||||
|  |  | ||||||
|  |         # Destroy for real | ||||||
|  |         self.ok("destroy -R /n*/prep") | ||||||
|  |         self.ok("list -l") | ||||||
|         self.match("/newton/raw uint16_6\n" |         self.match("/newton/raw uint16_6\n" | ||||||
|                    "/newton/zzz/rawnotch uint16_9\n") |                    "/newton/zzz/rawnotch uint16_9\n") | ||||||
|  |  | ||||||
|         self.ok("destroy /newton/zzz/rawnotch") |         self.ok("destroy /newton/zzz/rawnotch") | ||||||
|         self.ok("list") |         self.ok("list -l") | ||||||
|         self.match("/newton/raw uint16_6\n") |         self.match("/newton/raw uint16_6\n") | ||||||
|  |  | ||||||
|         self.ok("destroy /newton/raw") |         self.ok("destroy /newton/raw") | ||||||
|         self.ok("create /newton/raw uint16_6") |         self.ok("create /newton/raw uint16_6") | ||||||
|         self.ok("destroy /newton/raw") |         # Specify --remove with no data | ||||||
|  |         self.ok("destroy --remove /newton/raw") | ||||||
|         self.ok("list") |         self.ok("list") | ||||||
|         self.match("") |         self.match("") | ||||||
|  |  | ||||||
| @@ -753,18 +794,17 @@ class TestCmdline(object): | |||||||
|             self.ok("list") |             self.ok("list") | ||||||
|             self.contain(path) |             self.contain(path) | ||||||
|             # Make sure it was created empty |             # Make sure it was created empty | ||||||
|             self.ok("list --detail --path " + path) |             self.ok("list --detail " + path) | ||||||
|             self.contain("(no intervals)") |             self.contain("(no intervals)") | ||||||
|  |  | ||||||
|     def test_12_unicode(self): |     def test_12_unicode(self): | ||||||
|         # Unicode paths. |         # Unicode paths. | ||||||
|         self.ok("destroy /newton/asdf/qwer") |         self.ok("destroy /newton/asdf/qwer") | ||||||
|         self.ok("destroy /newton/prep") |         self.ok("destroy /newton/prep /newton/raw") | ||||||
|         self.ok("destroy /newton/raw") |  | ||||||
|         self.ok("destroy /newton/zzz") |         self.ok("destroy /newton/zzz") | ||||||
|  |  | ||||||
|         self.ok(u"create /düsseldorf/raw uint16_6") |         self.ok(u"create /düsseldorf/raw uint16_6") | ||||||
|         self.ok("list --detail") |         self.ok("list -l --detail") | ||||||
|         self.contain(u"/düsseldorf/raw uint16_6") |         self.contain(u"/düsseldorf/raw uint16_6") | ||||||
|         self.contain("(no intervals)") |         self.contain("(no intervals)") | ||||||
|  |  | ||||||
| @@ -815,7 +855,7 @@ class TestCmdline(object): | |||||||
|  |  | ||||||
|         # Now recreate the data one more time and make sure there are |         # Now recreate the data one more time and make sure there are | ||||||
|         # fewer files. |         # fewer files. | ||||||
|         self.ok("destroy /newton/prep") |         self.ok("destroy --remove /newton/prep") | ||||||
|         self.fail("destroy /newton/prep") # already destroyed |         self.fail("destroy /newton/prep") # already destroyed | ||||||
|         self.ok("create /newton/prep float32_8") |         self.ok("create /newton/prep float32_8") | ||||||
|         os.environ['TZ'] = "UTC" |         os.environ['TZ'] = "UTC" | ||||||
| @@ -826,14 +866,16 @@ class TestCmdline(object): | |||||||
|         for (dirpath, dirnames, filenames) in os.walk(testdb): |         for (dirpath, dirnames, filenames) in os.walk(testdb): | ||||||
|             nfiles += len(filenames) |             nfiles += len(filenames) | ||||||
|         lt_(nfiles, 50) |         lt_(nfiles, 50) | ||||||
|         self.ok("destroy /newton/prep") # destroy again |         self.ok("destroy -R /newton/prep") # destroy again | ||||||
|  |  | ||||||
|     def test_14_remove_files(self): |     def test_14_remove_files(self): | ||||||
|         # Test BulkData's ability to remove when data is split into |         # Test BulkData's ability to remove when data is split into | ||||||
|         # multiple files.  Should be a fairly comprehensive test of |         # multiple files.  Should be a fairly comprehensive test of | ||||||
|         # remove functionality. |         # remove functionality. | ||||||
|  |         # Also limit max_removals, to cover more functionality. | ||||||
|         server_stop() |         server_stop() | ||||||
|         server_start(bulkdata_args = { "file_size" : 920, # 23 rows per file |         server_start(max_removals = 4321, | ||||||
|  |                      bulkdata_args = { "file_size" : 920, # 23 rows per file | ||||||
|                                        "files_per_dir" : 3 }) |                                        "files_per_dir" : 3 }) | ||||||
|  |  | ||||||
|         # Insert data.  Just for fun, insert out of order |         # Insert data.  Just for fun, insert out of order | ||||||
| @@ -848,7 +890,7 @@ class TestCmdline(object): | |||||||
|         du_before = nilmdb.utils.diskusage.du(testdb) |         du_before = nilmdb.utils.diskusage.du(testdb) | ||||||
|  |  | ||||||
|         # Make sure we have the data we expect |         # Make sure we have the data we expect | ||||||
|         self.ok("list --detail") |         self.ok("list -l --detail") | ||||||
|         self.match("/newton/prep float32_8\n" + |         self.match("/newton/prep float32_8\n" + | ||||||
|                    "  [ Fri, 23 Mar 2012 10:00:00.000000 +0000" |                    "  [ Fri, 23 Mar 2012 10:00:00.000000 +0000" | ||||||
|                    " -> Fri, 23 Mar 2012 10:01:59.991668 +0000 ]\n" |                    " -> Fri, 23 Mar 2012 10:01:59.991668 +0000 ]\n" | ||||||
| @@ -884,7 +926,7 @@ class TestCmdline(object): | |||||||
|         self.match("3600\n") |         self.match("3600\n") | ||||||
|  |  | ||||||
|         # See the missing chunks in list output |         # See the missing chunks in list output | ||||||
|         self.ok("list --detail") |         self.ok("list -l --detail") | ||||||
|         self.match("/newton/prep float32_8\n" + |         self.match("/newton/prep float32_8\n" + | ||||||
|                    "  [ Fri, 23 Mar 2012 10:00:00.000000 +0000" |                    "  [ Fri, 23 Mar 2012 10:00:00.000000 +0000" | ||||||
|                    " -> Fri, 23 Mar 2012 10:00:05.000000 +0000 ]\n" |                    " -> Fri, 23 Mar 2012 10:00:05.000000 +0000 ]\n" | ||||||
| @@ -974,8 +1016,20 @@ class TestCmdline(object): | |||||||
|         self.match("[ Thu, 01 Jan 2004 00:00:00.000000 +0000 -" |         self.match("[ Thu, 01 Jan 2004 00:00:00.000000 +0000 -" | ||||||
|                    "> Sat, 01 Jan 2005 00:00:00.000000 +0000 ]\n") |                    "> Sat, 01 Jan 2005 00:00:00.000000 +0000 ]\n") | ||||||
|  |  | ||||||
|         self.ok("destroy /diff/1") |         # optimize | ||||||
|         self.ok("destroy /diff/2") |         self.ok("insert -s 01-01-2002 -e 01-01-2004 /diff/1 /dev/null") | ||||||
|  |         self.ok("intervals /diff/1") | ||||||
|  |         self.match("[ Sat, 01 Jan 2000 00:00:00.000000 +0000 -" | ||||||
|  |                    "> Thu, 01 Jan 2004 00:00:00.000000 +0000 ]\n" | ||||||
|  |                    "[ Thu, 01 Jan 2004 00:00:00.000000 +0000 -" | ||||||
|  |                    "> Sat, 01 Jan 2005 00:00:00.000000 +0000 ]\n") | ||||||
|  |         self.ok("intervals /diff/1 --optimize") | ||||||
|  |         self.ok("intervals /diff/1 -o") | ||||||
|  |         self.match("[ Sat, 01 Jan 2000 00:00:00.000000 +0000 -" | ||||||
|  |                    "> Sat, 01 Jan 2005 00:00:00.000000 +0000 ]\n") | ||||||
|  |  | ||||||
|  |         self.ok("destroy -R /diff/1") | ||||||
|  |         self.ok("destroy -R /diff/2") | ||||||
|  |  | ||||||
|     def test_16_rename(self): |     def test_16_rename(self): | ||||||
|         # Test renaming.  Force file size smaller so we get more files |         # Test renaming.  Force file size smaller so we get more files | ||||||
| @@ -1008,7 +1062,7 @@ class TestCmdline(object): | |||||||
|             else: |             else: | ||||||
|                 raise AssertionError("data not found at " + seek) |                 raise AssertionError("data not found at " + seek) | ||||||
|             # Verify "list" output |             # Verify "list" output | ||||||
|             self.ok("list") |             self.ok("list -l") | ||||||
|             self.match("/" + "/".join(components) + " float32_8\n") |             self.match("/" + "/".join(components) + " float32_8\n") | ||||||
|  |  | ||||||
|         # Lots of renames |         # Lots of renames | ||||||
| @@ -1018,10 +1072,12 @@ class TestCmdline(object): | |||||||
|         self.contain("old and new paths are the same") |         self.contain("old and new paths are the same") | ||||||
|         check_path("newton", "prep") |         check_path("newton", "prep") | ||||||
|         self.fail("rename /newton/prep /newton") |         self.fail("rename /newton/prep /newton") | ||||||
|         self.contain("subdirs of this path already exist") |         self.contain("path must contain at least one folder") | ||||||
|         self.fail("rename /newton/prep /newton/prep/") |         self.fail("rename /newton/prep /newton/prep/") | ||||||
|         self.contain("invalid path") |         self.contain("invalid path") | ||||||
|         self.ok("rename /newton/prep /newton/foo") |         self.ok("rename /newton/prep /newton/foo/1") | ||||||
|  |         check_path("newton", "foo", "1") | ||||||
|  |         self.ok("rename /newton/foo/1 /newton/foo") | ||||||
|         check_path("newton", "foo") |         check_path("newton", "foo") | ||||||
|         self.ok("rename /newton/foo /totally/different/thing") |         self.ok("rename /newton/foo /totally/different/thing") | ||||||
|         check_path("totally", "different", "thing") |         check_path("totally", "different", "thing") | ||||||
| @@ -1039,7 +1095,7 @@ class TestCmdline(object): | |||||||
|         self.fail("rename /foo/bar /xxx/yyy/zzz/www") |         self.fail("rename /foo/bar /xxx/yyy/zzz/www") | ||||||
|         self.contain("path is subdir of existing node") |         self.contain("path is subdir of existing node") | ||||||
|         self.ok("rename /foo/bar /xxx/yyy/mmm") |         self.ok("rename /foo/bar /xxx/yyy/mmm") | ||||||
|         self.ok("destroy /xxx/yyy/zzz") |         self.ok("destroy -R /xxx/yyy/zzz") | ||||||
|         check_path("xxx", "yyy", "mmm") |         check_path("xxx", "yyy", "mmm") | ||||||
|  |  | ||||||
|         # Extract it at the final path |         # Extract it at the final path | ||||||
| @@ -1047,7 +1103,7 @@ class TestCmdline(object): | |||||||
|                 "--end '2012-03-23 10:04:01'") |                 "--end '2012-03-23 10:04:01'") | ||||||
|         eq_(self.captured, extract_before) |         eq_(self.captured, extract_before) | ||||||
|  |  | ||||||
|         self.ok("destroy /xxx/yyy/mmm") |         self.ok("destroy -R /xxx/yyy/mmm") | ||||||
|  |  | ||||||
|         # Make sure temporary rename dirs weren't left around |         # Make sure temporary rename dirs weren't left around | ||||||
|         for (dirpath, dirnames, filenames) in os.walk(testdb): |         for (dirpath, dirnames, filenames) in os.walk(testdb): | ||||||
|   | |||||||
| @@ -8,8 +8,11 @@ from nose.tools import * | |||||||
| from nose.tools import assert_raises | from nose.tools import assert_raises | ||||||
| import itertools | import itertools | ||||||
|  |  | ||||||
| from nilmdb.server.interval import (Interval, DBInterval, | from nilmdb.utils.interval import IntervalError | ||||||
|                                     IntervalSet, IntervalError) | from nilmdb.server.interval import Interval, DBInterval, IntervalSet | ||||||
|  |  | ||||||
|  | # so we can test them separately | ||||||
|  | from nilmdb.utils.interval import Interval as UtilsInterval | ||||||
|  |  | ||||||
| from testutil.helpers import * | from testutil.helpers import * | ||||||
| import unittest | import unittest | ||||||
| @@ -47,6 +50,23 @@ def makeset(string): | |||||||
|     return iset |     return iset | ||||||
|  |  | ||||||
| class TestInterval: | class TestInterval: | ||||||
|  |     def test_client_interval(self): | ||||||
|  |         # Run interval tests against the Python version of Interval. | ||||||
|  |         global Interval | ||||||
|  |         NilmdbInterval = Interval | ||||||
|  |         Interval = UtilsInterval | ||||||
|  |         self.test_interval() | ||||||
|  |         self.test_interval_intersect() | ||||||
|  |         Interval = NilmdbInterval | ||||||
|  |  | ||||||
|  |         # Other helpers in nilmdb.utils.interval | ||||||
|  |         i = [ UtilsInterval(1,2), UtilsInterval(2,3), UtilsInterval(4,5) ] | ||||||
|  |         eq_(list(nilmdb.utils.interval.optimize(i)), | ||||||
|  |             [ UtilsInterval(1,3), UtilsInterval(4,5) ]) | ||||||
|  |         eq_(UtilsInterval(1234567890123456, 1234567890654321).human_string(), | ||||||
|  |             "[ Fri, 13 Feb 2009 18:31:30.123456 -0500 -> " + | ||||||
|  |             "Fri, 13 Feb 2009 18:31:30.654321 -0500 ]") | ||||||
|  |  | ||||||
|     def test_interval(self): |     def test_interval(self): | ||||||
|         # Test Interval class |         # Test Interval class | ||||||
|         os.environ['TZ'] = "America/New_York" |         os.environ['TZ'] = "America/New_York" | ||||||
| @@ -214,15 +234,18 @@ class TestInterval: | |||||||
|             x = makeset("[--)") & 1234 |             x = makeset("[--)") & 1234 | ||||||
|  |  | ||||||
|         def do_test(a, b, c, d): |         def do_test(a, b, c, d): | ||||||
|             # a & b == c |             # a & b == c (using nilmdb.server.interval) | ||||||
|             ab = IntervalSet() |             ab = IntervalSet() | ||||||
|             for x in b: |             for x in b: | ||||||
|                 for i in (a & x): |                 for i in (a & x): | ||||||
|                     ab += i |                     ab += i | ||||||
|             eq_(ab,c) |             eq_(ab,c) | ||||||
|  |  | ||||||
|  |             # a & b == c (using nilmdb.utils.interval) | ||||||
|  |             eq_(IntervalSet(nilmdb.utils.interval.intersection(a,b)), c) | ||||||
|  |  | ||||||
|             # a \ b == d |             # a \ b == d | ||||||
|             eq_(IntervalSet(a.set_difference(b)), d) |             eq_(IntervalSet(nilmdb.utils.interval.set_difference(a,b)), d) | ||||||
|  |  | ||||||
|         # Intersection with intervals |         # Intersection with intervals | ||||||
|         do_test(makeset("[---|---)[)"), |         do_test(makeset("[---|---)[)"), | ||||||
| @@ -287,10 +310,22 @@ class TestInterval: | |||||||
|         b = makeset("[-) [--) [)") |         b = makeset("[-) [--) [)") | ||||||
|         c = makeset("[----)     ") |         c = makeset("[----)     ") | ||||||
|         d = makeset("  [-)      ") |         d = makeset("  [-)      ") | ||||||
|         eq_(a.set_difference(b, list(c)[0]), d) |         eq_(nilmdb.utils.interval.set_difference( | ||||||
|  |             a.intersection(list(c)[0]), b.intersection(list(c)[0])), d) | ||||||
|  |  | ||||||
|  |         # Fill out test coverage for non-subsets | ||||||
|  |         def diff2(a,b, subset): | ||||||
|  |             return nilmdb.utils.interval._interval_math_helper( | ||||||
|  |                 a, b, (lambda a, b: b and not a), subset=subset) | ||||||
|  |         with assert_raises(nilmdb.utils.interval.IntervalError): | ||||||
|  |             list(diff2(a,b,True)) | ||||||
|  |         list(diff2(a,b,False)) | ||||||
|  |  | ||||||
|         # Empty second set |         # Empty second set | ||||||
|         eq_(a.set_difference(IntervalSet()), a) |         eq_(nilmdb.utils.interval.set_difference(a, IntervalSet()), a) | ||||||
|  |  | ||||||
|  |         # Empty second set | ||||||
|  |         eq_(nilmdb.utils.interval.set_difference(a, IntervalSet()), a) | ||||||
|  |  | ||||||
| class TestIntervalDB: | class TestIntervalDB: | ||||||
|     def test_dbinterval(self): |     def test_dbinterval(self): | ||||||
| @@ -372,14 +407,13 @@ class TestIntervalSpeed: | |||||||
|     def test_interval_speed(self): |     def test_interval_speed(self): | ||||||
|         import yappi |         import yappi | ||||||
|         import time |         import time | ||||||
|         import testutil.aplotter as aplotter |  | ||||||
|         import random |         import random | ||||||
|         import math |         import math | ||||||
|  |  | ||||||
|         print |         print | ||||||
|         yappi.start() |         yappi.start() | ||||||
|         speeds = {} |         speeds = {} | ||||||
|         limit = 10 # was 20 |         limit = 22 # was 20 | ||||||
|         for j in [ 2**x for x in range(5,limit) ]: |         for j in [ 2**x for x in range(5,limit) ]: | ||||||
|             start = time.time() |             start = time.time() | ||||||
|             iset = IntervalSet() |             iset = IntervalSet() | ||||||
| @@ -393,6 +427,5 @@ class TestIntervalSpeed: | |||||||
|                    speed/j, |                    speed/j, | ||||||
|                    speed / (j*math.log(j))) # should be constant |                    speed / (j*math.log(j))) # should be constant | ||||||
|             speeds[j] = speed |             speeds[j] = speed | ||||||
|         aplotter.plot(speeds.keys(), speeds.values(), plot_slope=True) |  | ||||||
|         yappi.stop() |         yappi.stop() | ||||||
|         yappi.print_stats(sort_type=yappi.SORTTYPE_TTOT, limit=10) |         yappi.print_stats(sort_type=yappi.SORTTYPE_TTOT, limit=10) | ||||||
|   | |||||||
| @@ -1,61 +0,0 @@ | |||||||
| import nilmdb |  | ||||||
| from nilmdb.utils.printf import * |  | ||||||
|  |  | ||||||
| import nose |  | ||||||
| from nose.tools import * |  | ||||||
| from nose.tools import assert_raises |  | ||||||
| import threading |  | ||||||
| import time |  | ||||||
|  |  | ||||||
| from testutil.helpers import * |  | ||||||
|  |  | ||||||
| def func_with_callback(a, b, callback): |  | ||||||
|     callback(a) |  | ||||||
|     callback(b) |  | ||||||
|     callback(a+b) |  | ||||||
|     return "return value" |  | ||||||
|  |  | ||||||
| class TestIteratorizer(object): |  | ||||||
|     def test(self): |  | ||||||
|  |  | ||||||
|         # First try it with a normal callback |  | ||||||
|         self.result = "" |  | ||||||
|         def cb(x): |  | ||||||
|             self.result += str(x) |  | ||||||
|         func_with_callback(1, 2, cb) |  | ||||||
|         eq_(self.result, "123") |  | ||||||
|  |  | ||||||
|         # Now make it an iterator |  | ||||||
|         result = "" |  | ||||||
|         f = lambda x: func_with_callback(1, 2, x) |  | ||||||
|         with nilmdb.utils.Iteratorizer(f) as it: |  | ||||||
|             for i in it: |  | ||||||
|                 result += str(i) |  | ||||||
|         eq_(result, "123") |  | ||||||
|         eq_(it.retval, "return value") |  | ||||||
|  |  | ||||||
|         # Make sure things work when an exception occurs |  | ||||||
|         result = "" |  | ||||||
|         with nilmdb.utils.Iteratorizer( |  | ||||||
|             lambda x: func_with_callback(1, "a", x)) as it: |  | ||||||
|             with assert_raises(TypeError) as e: |  | ||||||
|                 for i in it: |  | ||||||
|                     result += str(i) |  | ||||||
|         eq_(result, "1a") |  | ||||||
|  |  | ||||||
|         # Now try to trigger the case where we stop iterating |  | ||||||
|         # mid-generator, and expect the iteratorizer to clean up after |  | ||||||
|         # itself.  This doesn't have a particular result in the test, |  | ||||||
|         # but gains coverage. |  | ||||||
|         def foo(): |  | ||||||
|             with nilmdb.utils.Iteratorizer(f) as it: |  | ||||||
|                 it.next() |  | ||||||
|         foo() |  | ||||||
|         eq_(it.retval, None) |  | ||||||
|  |  | ||||||
|         # Do the same thing when the curl hack is applied |  | ||||||
|         def foo(): |  | ||||||
|             with nilmdb.utils.Iteratorizer(f, curl_hack = True) as it: |  | ||||||
|                 it.next() |  | ||||||
|         foo() |  | ||||||
|         eq_(it.retval, None) |  | ||||||
| @@ -1,266 +0,0 @@ | |||||||
| # -*- coding: utf-8 -*- |  | ||||||
|  |  | ||||||
| import nilmdb |  | ||||||
|  |  | ||||||
| from nilmdb.utils.printf import * |  | ||||||
|  |  | ||||||
| from nose.tools import * |  | ||||||
| from nose.tools import assert_raises |  | ||||||
| import distutils.version |  | ||||||
| import itertools |  | ||||||
| import os |  | ||||||
| import sys |  | ||||||
| import random |  | ||||||
| import unittest |  | ||||||
|  |  | ||||||
| from testutil.helpers import * |  | ||||||
|  |  | ||||||
| from nilmdb.server.layout import * |  | ||||||
|  |  | ||||||
| class TestLayouts(object): |  | ||||||
|     # Some nilmdb.layout tests.  Not complete, just fills in missing |  | ||||||
|     # coverage. |  | ||||||
|     def test_layouts(self): |  | ||||||
|         x = nilmdb.server.layout.get_named("float32_8") |  | ||||||
|         y = nilmdb.server.layout.get_named("float32_8") |  | ||||||
|         eq_(x.count, y.count) |  | ||||||
|         eq_(x.datatype, y.datatype) |  | ||||||
|         y = nilmdb.server.layout.get_named("float32_7") |  | ||||||
|         ne_(x.count, y.count) |  | ||||||
|         eq_(x.datatype, y.datatype) |  | ||||||
|  |  | ||||||
|     def test_parsing(self): |  | ||||||
|         self.real_t_parsing("float32_8", "uint16_6", "uint16_9") |  | ||||||
|         self.real_t_parsing("float32_8", "uint16_6", "uint16_9") |  | ||||||
|     def real_t_parsing(self, name_prep, name_raw, name_rawnotch): |  | ||||||
|         # invalid layouts |  | ||||||
|         with assert_raises(TypeError) as e: |  | ||||||
|             parser = Parser("NoSuchLayout") |  | ||||||
|         with assert_raises(TypeError) as e: |  | ||||||
|             parser = Parser("float32") |  | ||||||
|  |  | ||||||
|         # too little data |  | ||||||
|         parser = Parser(name_prep) |  | ||||||
|         data = ( "1234567890.000000 1.1 2.2 3.3 4.4 5.5\n" + |  | ||||||
|                  "1234567890.100000 1.1 2.2 3.3 4.4 5.5\n") |  | ||||||
|         with assert_raises(ParserError) as e: |  | ||||||
|             parser.parse(data) |  | ||||||
|         in_("error", str(e.exception)) |  | ||||||
|  |  | ||||||
|         # too much data |  | ||||||
|         parser = Parser(name_prep) |  | ||||||
|         data = ( "1234567890.000000 1.1 2.2 3.3 4.4 5.5 6.6 7.7 8.8 9.9\n" + |  | ||||||
|                  "1234567890.100000 1.1 2.2 3.3 4.4 5.5 6.6 7.7 8.8 9.9\n") |  | ||||||
|         with assert_raises(ParserError) as e: |  | ||||||
|             parser.parse(data) |  | ||||||
|         in_("error", str(e.exception)) |  | ||||||
|  |  | ||||||
|         # just right |  | ||||||
|         parser = Parser(name_prep) |  | ||||||
|         data = ( "1234567890.000000 1.1 2.2 3.3 4.4 5.5 6.6 7.7 8.8\n" + |  | ||||||
|                  "1234567890.100000 1.1 2.2 3.3 4.4 5.5 6.6 7.7 8.8\n") |  | ||||||
|         parser.parse(data) |  | ||||||
|         eq_(parser.min_timestamp, 1234567890.0) |  | ||||||
|         eq_(parser.max_timestamp, 1234567890.1) |  | ||||||
|         eq_(parser.data, [[1234567890.0,1.1,2.2,3.3,4.4,5.5,6.6,7.7,8.8], |  | ||||||
|                           [1234567890.1,1.1,2.2,3.3,4.4,5.5,6.6,7.7,8.8]]) |  | ||||||
|  |  | ||||||
|         # try uint16_6 too, with clamping |  | ||||||
|         parser = Parser(name_raw) |  | ||||||
|         data = ( "1234567890.000000 1 2 3 4 5 6\n" + |  | ||||||
|                  "1234567890.100000 1 2 3 4 5 6\n" ) |  | ||||||
|         parser.parse(data) |  | ||||||
|         eq_(parser.data, [[1234567890.0,1,2,3,4,5,6], |  | ||||||
|                           [1234567890.1,1,2,3,4,5,6]]) |  | ||||||
|  |  | ||||||
|         # pass an instantiated class |  | ||||||
|         parser = Parser(get_named(name_rawnotch)) |  | ||||||
|         data = ( "1234567890.000000 1 2 3 4 5 6 7 8 9\n" + |  | ||||||
|                  "1234567890.100000 1 2 3 4 5 6 7 8 9\n" ) |  | ||||||
|         parser.parse(data) |  | ||||||
|  |  | ||||||
|         # non-monotonic |  | ||||||
|         parser = Parser(name_raw) |  | ||||||
|         data = ( "1234567890.100000 1 2 3 4 5 6\n" + |  | ||||||
|                  "1234567890.099999 1 2 3 4 5 6\n" ) |  | ||||||
|         with assert_raises(ParserError) as e: |  | ||||||
|             parser.parse(data) |  | ||||||
|         in_("not monotonically increasing", str(e.exception)) |  | ||||||
|  |  | ||||||
|         parser = Parser(name_raw) |  | ||||||
|         data = ( "1234567890.100000 1 2 3 4 5 6\n" + |  | ||||||
|                  "1234567890.100000 1 2 3 4 5 6\n" ) |  | ||||||
|         with assert_raises(ParserError) as e: |  | ||||||
|             parser.parse(data) |  | ||||||
|         in_("not monotonically increasing", str(e.exception)) |  | ||||||
|  |  | ||||||
|         parser = Parser(name_raw) |  | ||||||
|         data = ( "1234567890.100000 1 2 3 4 5 6\n" + |  | ||||||
|                  "1234567890.100001 1 2 3 4 5 6\n" ) |  | ||||||
|         parser.parse(data) |  | ||||||
|  |  | ||||||
|         # uint16_6 with values out of bounds |  | ||||||
|         parser = Parser(name_raw) |  | ||||||
|         data = ( "1234567890.000000 1 2 3 4 500000 6\n" + |  | ||||||
|                  "1234567890.100000 1 2 3 4 5 6\n" ) |  | ||||||
|         with assert_raises(ParserError) as e: |  | ||||||
|             parser.parse(data) |  | ||||||
|         in_("value out of range", str(e.exception)) |  | ||||||
|  |  | ||||||
|         # Empty data should work but is useless |  | ||||||
|         parser = Parser(name_raw) |  | ||||||
|         data = "" |  | ||||||
|         parser.parse(data) |  | ||||||
|         assert(parser.min_timestamp is None) |  | ||||||
|         assert(parser.max_timestamp is None) |  | ||||||
|  |  | ||||||
|     def test_formatting(self): |  | ||||||
|         self.real_t_formatting("float32_8", "uint16_6", "uint16_9") |  | ||||||
|         self.real_t_formatting("float32_8", "uint16_6", "uint16_9") |  | ||||||
|     def real_t_formatting(self, name_prep, name_raw, name_rawnotch): |  | ||||||
|         # invalid layout |  | ||||||
|         with assert_raises(TypeError) as e: |  | ||||||
|             formatter = Formatter("NoSuchLayout") |  | ||||||
|  |  | ||||||
|         # too little data |  | ||||||
|         formatter = Formatter(name_prep) |  | ||||||
|         data = [ [ 1234567890.000000, 1.1, 2.2, 3.3, 4.4, 5.5 ], |  | ||||||
|                  [ 1234567890.100000, 1.1, 2.2, 3.3, 4.4, 5.5 ] ] |  | ||||||
|         with assert_raises(FormatterError) as e: |  | ||||||
|             formatter.format(data) |  | ||||||
|         in_("error", str(e.exception)) |  | ||||||
|  |  | ||||||
|         # too much data |  | ||||||
|         formatter = Formatter(name_prep) |  | ||||||
|         data = [ [ 1234567890.000000, 1, 2, 3, 4, 5, 6, 7, 8, 9 ], |  | ||||||
|                  [ 1234567890.100000, 1, 2, 3, 4, 5, 6, 7, 8, 9 ] ] |  | ||||||
|         with assert_raises(FormatterError) as e: |  | ||||||
|             formatter.format(data) |  | ||||||
|         in_("error", str(e.exception)) |  | ||||||
|  |  | ||||||
|         # just right |  | ||||||
|         formatter = Formatter(name_prep) |  | ||||||
|         data = [ [ 1234567890.000000, 1.1, 2.2, 3.3, 4.4, 5.5, 6.6, 7.7, 8.8 ], |  | ||||||
|                  [ 1234567890.100000, 1.1, 2.2, 3.3, 4.4, 5.5, 6.6, 7.7, 8.8 ] ] |  | ||||||
|         text = formatter.format(data) |  | ||||||
|         eq_(text, |  | ||||||
|             "1234567890.000000 1.100000e+00 2.200000e+00 3.300000e+00 " |  | ||||||
|             "4.400000e+00 5.500000e+00 6.600000e+00 7.700000e+00 " |  | ||||||
|             "8.800000e+00\n" + |  | ||||||
|             "1234567890.100000 1.100000e+00 2.200000e+00 3.300000e+00 " |  | ||||||
|             "4.400000e+00 5.500000e+00 6.600000e+00 7.700000e+00 " |  | ||||||
|             "8.800000e+00\n") |  | ||||||
|  |  | ||||||
|         # try uint16_6 too |  | ||||||
|         formatter = Formatter(name_raw) |  | ||||||
|         data = [ [ 1234567890.000000, 1, 2, 3, 4, 5, 6 ], |  | ||||||
|                  [ 1234567890.100000, 1, 2, 3, 4, 5, 6 ] ] |  | ||||||
|         text = formatter.format(data) |  | ||||||
|         eq_(text, |  | ||||||
|             "1234567890.000000 1 2 3 4 5 6\n" + |  | ||||||
|             "1234567890.100000 1 2 3 4 5 6\n") |  | ||||||
|  |  | ||||||
|         # pass an instantiated class |  | ||||||
|         formatter = Formatter(get_named(name_rawnotch)) |  | ||||||
|         data = [ [ 1234567890.000000, 1, 2, 3, 4, 5, 6, 7, 8, 9 ], |  | ||||||
|                  [ 1234567890.100000, 1, 2, 3, 4, 5, 6, 7, 8, 9 ] ] |  | ||||||
|         text = formatter.format(data) |  | ||||||
|         eq_(text, |  | ||||||
|             "1234567890.000000 1 2 3 4 5 6 7 8 9\n" + |  | ||||||
|             "1234567890.100000 1 2 3 4 5 6 7 8 9\n") |  | ||||||
|  |  | ||||||
|         # Empty data should work but is useless |  | ||||||
|         formatter = Formatter(name_raw) |  | ||||||
|         data = [] |  | ||||||
|         text = formatter.format(data) |  | ||||||
|         eq_(text, "") |  | ||||||
|  |  | ||||||
|     def test_roundtrip(self): |  | ||||||
|         self.real_t_roundtrip("float32_8", "uint16_6", "uint16_9") |  | ||||||
|         self.real_t_roundtrip("float32_8", "uint16_6", "uint16_9") |  | ||||||
|     def real_t_roundtrip(self, name_prep, name_raw, name_rawnotch): |  | ||||||
|         # Verify that textual data passed into the Parser, and then |  | ||||||
|         # back through the Formatter, then back into the Parser, |  | ||||||
|         # gives identical parsed representations |  | ||||||
|         random.seed(12345) |  | ||||||
|  |  | ||||||
|         def do_roundtrip(layout, datagen): |  | ||||||
|             for i in range(100): |  | ||||||
|                 rows = random.randint(1,100) |  | ||||||
|                 data = "" |  | ||||||
|                 ts = 1234567890 |  | ||||||
|                 for r in range(rows): |  | ||||||
|                     ts += random.uniform(0,1) |  | ||||||
|                     row = sprintf("%f", ts) + " " |  | ||||||
|                     row += " ".join(datagen()) |  | ||||||
|                     row += "\n" |  | ||||||
|                     data += row |  | ||||||
|                 parser1 = Parser(layout) |  | ||||||
|                 formatter = Formatter(layout) |  | ||||||
|                 parser2 = Parser(layout) |  | ||||||
|                 parser1.parse(data) |  | ||||||
|                 parser2.parse(formatter.format(parser1.data)) |  | ||||||
|                 eq_(parser1.data, parser2.data) |  | ||||||
|  |  | ||||||
|         def datagen(): |  | ||||||
|             return [ sprintf("%.6e", random.uniform(-1000,1000)) |  | ||||||
|                      for x in range(8) ] |  | ||||||
|         do_roundtrip(name_prep, datagen) |  | ||||||
|  |  | ||||||
|         def datagen(): |  | ||||||
|             return [ sprintf("%d", random.randint(0,65535)) |  | ||||||
|                      for x in range(6) ] |  | ||||||
|         do_roundtrip(name_raw, datagen) |  | ||||||
|  |  | ||||||
|         def datagen(): |  | ||||||
|             return [ sprintf("%d", random.randint(0,65535)) |  | ||||||
|                      for x in range(9) ] |  | ||||||
|         do_roundtrip(name_rawnotch, datagen) |  | ||||||
|  |  | ||||||
| class TestLayoutSpeed: |  | ||||||
|     @unittest.skip("this is slow") |  | ||||||
|     def test_layout_speed(self): |  | ||||||
|         import time |  | ||||||
|  |  | ||||||
|         random.seed(54321) |  | ||||||
|  |  | ||||||
|         def do_speedtest(layout, datagen, rows = 5000, times = 100): |  | ||||||
|             # Build data once |  | ||||||
|             data = "" |  | ||||||
|             ts = 1234567890 |  | ||||||
|             for r in range(rows): |  | ||||||
|                 ts += random.uniform(0,1) |  | ||||||
|                 row = sprintf("%f", ts) + " " |  | ||||||
|                 row += " ".join(datagen()) |  | ||||||
|                 row += "\n" |  | ||||||
|                 data += row |  | ||||||
|  |  | ||||||
|             # Do lots of roundtrips |  | ||||||
|             start = time.time() |  | ||||||
|             for i in range(times): |  | ||||||
|                 parser = Parser(layout) |  | ||||||
|                 formatter = Formatter(layout) |  | ||||||
|                 parser.parse(data) |  | ||||||
|                 formatter.format(parser.data) |  | ||||||
|             elapsed = time.time() - start |  | ||||||
|             printf("roundtrip %s: %d ms, %.1f μs/row, %d rows/sec\n", |  | ||||||
|                    layout, |  | ||||||
|                    elapsed * 1e3, |  | ||||||
|                    (elapsed * 1e6) / (rows * times), |  | ||||||
|                    (rows * times) / elapsed) |  | ||||||
|  |  | ||||||
|         print "" |  | ||||||
|         def datagen(): |  | ||||||
|             return [ sprintf("%.6e", random.uniform(-1000,1000)) |  | ||||||
|                      for x in range(10) ] |  | ||||||
|         do_speedtest("float32_10", datagen) |  | ||||||
|  |  | ||||||
|         def datagen(): |  | ||||||
|             return [ sprintf("%d", random.randint(0,65535)) |  | ||||||
|                      for x in range(10) ] |  | ||||||
|         do_speedtest("uint16_10", datagen) |  | ||||||
|  |  | ||||||
|         def datagen(): |  | ||||||
|             return [ sprintf("%d", random.randint(0,65535)) |  | ||||||
|                      for x in range(6) ] |  | ||||||
|         do_speedtest("uint16_6", datagen) |  | ||||||
| @@ -28,9 +28,6 @@ class Test00Nilmdb(object):  # named 00 so it runs first | |||||||
|     def test_NilmDB(self): |     def test_NilmDB(self): | ||||||
|         recursive_unlink(testdb) |         recursive_unlink(testdb) | ||||||
|  |  | ||||||
|         with assert_raises(IOError): |  | ||||||
|             nilmdb.server.NilmDB("/nonexistant-db/foo") |  | ||||||
|  |  | ||||||
|         db = nilmdb.server.NilmDB(testdb) |         db = nilmdb.server.NilmDB(testdb) | ||||||
|         db.close() |         db.close() | ||||||
|         db = nilmdb.server.NilmDB(testdb) |         db = nilmdb.server.NilmDB(testdb) | ||||||
| @@ -93,13 +90,16 @@ class Test00Nilmdb(object):  # named 00 so it runs first | |||||||
|         eq_(db.stream_get_metadata("/newton/prep"), meta1) |         eq_(db.stream_get_metadata("/newton/prep"), meta1) | ||||||
|         eq_(db.stream_get_metadata("/newton/raw"), meta1) |         eq_(db.stream_get_metadata("/newton/raw"), meta1) | ||||||
|  |  | ||||||
|         # fill in some test coverage for start >= end |         # fill in some misc. test coverage | ||||||
|         with assert_raises(nilmdb.server.NilmDBError): |         with assert_raises(nilmdb.server.NilmDBError): | ||||||
|             db.stream_remove("/newton/prep", 0, 0) |             db.stream_remove("/newton/prep", 0, 0) | ||||||
|         with assert_raises(nilmdb.server.NilmDBError): |         with assert_raises(nilmdb.server.NilmDBError): | ||||||
|             db.stream_remove("/newton/prep", 1, 0) |             db.stream_remove("/newton/prep", 1, 0) | ||||||
|         db.stream_remove("/newton/prep", 0, 1) |         db.stream_remove("/newton/prep", 0, 1) | ||||||
|  |  | ||||||
|  |         with assert_raises(nilmdb.server.NilmDBError): | ||||||
|  |             db.stream_extract("/newton/prep", count = True, binary = True) | ||||||
|  |  | ||||||
|         db.close() |         db.close() | ||||||
|  |  | ||||||
| class TestBlockingServer(object): | class TestBlockingServer(object): | ||||||
| @@ -157,11 +157,14 @@ class TestServer(object): | |||||||
|  |  | ||||||
|     def test_server(self): |     def test_server(self): | ||||||
|         # Make sure we can't force an exit, and test other 404 errors |         # Make sure we can't force an exit, and test other 404 errors | ||||||
|         for url in [ "/exit", "/", "/favicon.ico" ]: |         for url in [ "/exit", "/favicon.ico" ]: | ||||||
|             with assert_raises(HTTPError) as e: |             with assert_raises(HTTPError) as e: | ||||||
|                 geturl(url) |                 geturl(url) | ||||||
|             eq_(e.exception.code, 404) |             eq_(e.exception.code, 404) | ||||||
|  |  | ||||||
|  |         # Root page | ||||||
|  |         in_("This is NilmDB", geturl("/")) | ||||||
|  |  | ||||||
|         # Check version |         # Check version | ||||||
|         eq_(distutils.version.LooseVersion(getjson("/version")), |         eq_(distutils.version.LooseVersion(getjson("/version")), | ||||||
|             distutils.version.LooseVersion(nilmdb.__version__)) |             distutils.version.LooseVersion(nilmdb.__version__)) | ||||||
|   | |||||||
							
								
								
									
										373
									
								
								tests/test_numpyclient.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										373
									
								
								tests/test_numpyclient.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,373 @@ | |||||||
|  | # -*- coding: utf-8 -*- | ||||||
|  |  | ||||||
|  | import nilmdb.server | ||||||
|  | import nilmdb.client | ||||||
|  | import nilmdb.client.numpyclient | ||||||
|  |  | ||||||
|  | from nilmdb.utils.printf import * | ||||||
|  | from nilmdb.utils import timestamper | ||||||
|  | from nilmdb.client import ClientError, ServerError | ||||||
|  | from nilmdb.utils import datetime_tz | ||||||
|  |  | ||||||
|  | from nose.plugins.skip import SkipTest | ||||||
|  | from nose.tools import * | ||||||
|  | from nose.tools import assert_raises | ||||||
|  | import itertools | ||||||
|  | import distutils.version | ||||||
|  |  | ||||||
|  | from testutil.helpers import * | ||||||
|  |  | ||||||
|  | import numpy as np | ||||||
|  |  | ||||||
|  | testdb = "tests/numpyclient-testdb" | ||||||
|  | testurl = "http://localhost:32180/" | ||||||
|  |  | ||||||
|  | def setup_module(): | ||||||
|  |     global test_server, test_db | ||||||
|  |     # Clear out DB | ||||||
|  |     recursive_unlink(testdb) | ||||||
|  |  | ||||||
|  |     # Start web app on a custom port | ||||||
|  |     test_db = nilmdb.utils.serializer_proxy(nilmdb.server.NilmDB)( | ||||||
|  |         testdb, bulkdata_args = { "file_size" : 16384, | ||||||
|  |                                   "files_per_dir" : 3 } ) | ||||||
|  |  | ||||||
|  |     test_server = nilmdb.server.Server(test_db, host = "127.0.0.1", | ||||||
|  |                                        port = 32180, stoppable = False, | ||||||
|  |                                        fast_shutdown = True, | ||||||
|  |                                        force_traceback = True) | ||||||
|  |     test_server.start(blocking = False) | ||||||
|  |  | ||||||
|  | def teardown_module(): | ||||||
|  |     global test_server, test_db | ||||||
|  |     # Close web app | ||||||
|  |     test_server.stop() | ||||||
|  |     test_db.close() | ||||||
|  |  | ||||||
|  | class TestNumpyClient(object): | ||||||
|  |  | ||||||
|  |     def test_numpyclient_01_basic(self): | ||||||
|  |         # Test basic connection | ||||||
|  |         client = nilmdb.client.numpyclient.NumpyClient(url = testurl) | ||||||
|  |         version = client.version() | ||||||
|  |         eq_(distutils.version.LooseVersion(version), | ||||||
|  |             distutils.version.LooseVersion(test_server.version)) | ||||||
|  |  | ||||||
|  |         # Verify subclassing | ||||||
|  |         assert(isinstance(client, nilmdb.client.Client)) | ||||||
|  |  | ||||||
|  |         # Layouts | ||||||
|  |         for layout in "int8_t", "something_8", "integer_1": | ||||||
|  |             with assert_raises(ValueError): | ||||||
|  |                 for x in client.stream_extract_numpy("/foo", layout=layout): | ||||||
|  |                     pass | ||||||
|  |         for layout in "int8_1", "uint8_30", "int16_20", "float64_100": | ||||||
|  |             with assert_raises(ClientError) as e: | ||||||
|  |                 for x in client.stream_extract_numpy("/foo", layout=layout): | ||||||
|  |                     pass | ||||||
|  |             in_("No such stream", str(e.exception)) | ||||||
|  |  | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             for x in client.stream_extract_numpy("/foo"): | ||||||
|  |                 pass | ||||||
|  |         in_("can't get layout for path", str(e.exception)) | ||||||
|  |  | ||||||
|  |         client.close() | ||||||
|  |  | ||||||
|  |     def test_numpyclient_02_extract(self): | ||||||
|  |         client = nilmdb.client.numpyclient.NumpyClient(url = testurl) | ||||||
|  |  | ||||||
|  |         # Insert some data as text | ||||||
|  |         client.stream_create("/newton/prep", "float32_8") | ||||||
|  |         testfile = "tests/data/prep-20120323T1000" | ||||||
|  |         start = nilmdb.utils.time.parse_time("20120323T1000") | ||||||
|  |         rate = 120 | ||||||
|  |         data = timestamper.TimestamperRate(testfile, start, rate) | ||||||
|  |         result = client.stream_insert("/newton/prep", data, | ||||||
|  |                                       start, start + 119999777) | ||||||
|  |  | ||||||
|  |         # Extract Numpy arrays | ||||||
|  |         array = None | ||||||
|  |         pieces = 0 | ||||||
|  |         for chunk in client.stream_extract_numpy("/newton/prep", maxrows=1000): | ||||||
|  |             pieces += 1 | ||||||
|  |             if array is not None: | ||||||
|  |                 array = np.vstack((array, chunk)) | ||||||
|  |             else: | ||||||
|  |                 array = chunk | ||||||
|  |         eq_(array.shape, (14400, 9)) | ||||||
|  |         eq_(pieces, 15) | ||||||
|  |  | ||||||
|  |         # Try structured | ||||||
|  |         s = list(client.stream_extract_numpy("/newton/prep", structured = True)) | ||||||
|  |         assert(np.array_equal(np.c_[s[0]['timestamp'], s[0]['data']], array)) | ||||||
|  |  | ||||||
|  |         # Compare.  Will be close but not exact because the conversion | ||||||
|  |         # to and from ASCII was lossy. | ||||||
|  |         data = timestamper.TimestamperRate(testfile, start, rate) | ||||||
|  |         actual = np.fromstring(" ".join(data), sep=' ').reshape(14400, 9) | ||||||
|  |         assert(np.allclose(array, actual)) | ||||||
|  |  | ||||||
|  |         client.close() | ||||||
|  |  | ||||||
|  |     def test_numpyclient_03_insert(self): | ||||||
|  |         client = nilmdb.client.numpyclient.NumpyClient(url = testurl) | ||||||
|  |  | ||||||
|  |         # Limit _max_data just to get better coverage | ||||||
|  |         old_max_data = nilmdb.client.numpyclient.StreamInserterNumpy._max_data | ||||||
|  |         nilmdb.client.numpyclient.StreamInserterNumpy._max_data = 100000 | ||||||
|  |  | ||||||
|  |         client.stream_create("/test/1", "uint16_1") | ||||||
|  |         client.stream_insert_numpy("/test/1", | ||||||
|  |                                    np.array([[0, 1], | ||||||
|  |                                              [1, 2], | ||||||
|  |                                              [2, 3], | ||||||
|  |                                              [3, 4]])) | ||||||
|  |  | ||||||
|  |         # Wrong number of dimensions | ||||||
|  |         with assert_raises(ValueError) as e: | ||||||
|  |             client.stream_insert_numpy("/test/1", | ||||||
|  |                                        np.array([[[0, 1], | ||||||
|  |                                                   [1, 2]], | ||||||
|  |                                                  [[3, 4], | ||||||
|  |                                                   [4, 5]]])) | ||||||
|  |         in_("wrong number of dimensions", str(e.exception)) | ||||||
|  |  | ||||||
|  |         # Wrong number of fields | ||||||
|  |         with assert_raises(ValueError) as e: | ||||||
|  |             client.stream_insert_numpy("/test/1", | ||||||
|  |                                        np.array([[0, 1, 2], | ||||||
|  |                                                  [1, 2, 3], | ||||||
|  |                                                  [3, 4, 5], | ||||||
|  |                                                  [4, 5, 6]])) | ||||||
|  |         in_("wrong number of fields", str(e.exception)) | ||||||
|  |  | ||||||
|  |         # Unstructured | ||||||
|  |         client.stream_create("/test/2", "float32_8") | ||||||
|  |         client.stream_insert_numpy( | ||||||
|  |             "/test/2", | ||||||
|  |             client.stream_extract_numpy( | ||||||
|  |                 "/newton/prep", structured = False, maxrows = 1000)) | ||||||
|  |  | ||||||
|  |         # Structured, and specifying layout | ||||||
|  |         client.stream_create("/test/3", "float32_8") | ||||||
|  |         client.stream_insert_numpy( | ||||||
|  |             path = "/test/3", layout = "float32_8", | ||||||
|  |             data = client.stream_extract_numpy( | ||||||
|  |                 "/newton/prep", structured = True, maxrows = 1000)) | ||||||
|  |  | ||||||
|  |         # Structured, specifying wrong layout | ||||||
|  |         client.stream_create("/test/4", "float32_8") | ||||||
|  |         with assert_raises(ValueError) as e: | ||||||
|  |             client.stream_insert_numpy( | ||||||
|  |                 "/test/4", layout = "uint16_1", | ||||||
|  |                 data = client.stream_extract_numpy( | ||||||
|  |                     "/newton/prep", structured = True, maxrows = 1000)) | ||||||
|  |         in_("wrong dtype", str(e.exception)) | ||||||
|  |  | ||||||
|  |         # Unstructured, and specifying wrong layout | ||||||
|  |         client.stream_create("/test/5", "float32_8") | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             client.stream_insert_numpy( | ||||||
|  |                 "/test/5", layout = "uint16_8", | ||||||
|  |                 data = client.stream_extract_numpy( | ||||||
|  |                     "/newton/prep", structured = False, maxrows = 1000)) | ||||||
|  |         # timestamps will be screwy here, because data will be parsed wrong | ||||||
|  |         in_("error parsing input data", str(e.exception)) | ||||||
|  |  | ||||||
|  |         # Make sure the /newton/prep copies are identical | ||||||
|  |         a = np.vstack(client.stream_extract_numpy("/newton/prep")) | ||||||
|  |         b = np.vstack(client.stream_extract_numpy("/test/2")) | ||||||
|  |         c = np.vstack(client.stream_extract_numpy("/test/3")) | ||||||
|  |         assert(np.array_equal(a,b)) | ||||||
|  |         assert(np.array_equal(a,c)) | ||||||
|  |  | ||||||
|  |         # Make sure none of the files are greater than 16384 bytes as | ||||||
|  |         # we configured with the bulkdata_args above. | ||||||
|  |         datapath = os.path.join(testdb, "data") | ||||||
|  |         for (dirpath, dirnames, filenames) in os.walk(datapath): | ||||||
|  |             for f in filenames: | ||||||
|  |                 fn = os.path.join(dirpath, f) | ||||||
|  |                 size = os.path.getsize(fn) | ||||||
|  |                 if size > 16384: | ||||||
|  |                     raise AssertionError(sprintf("%s is too big: %d > %d\n", | ||||||
|  |                                                  fn, size, 16384)) | ||||||
|  |  | ||||||
|  |         nilmdb.client.numpyclient.StreamInserterNumpy._max_data = old_max_data | ||||||
|  |         client.close() | ||||||
|  |  | ||||||
|  |     def test_numpyclient_04_context(self): | ||||||
|  |         # Like test_client_context, but with Numpy data | ||||||
|  |         client = nilmdb.client.numpyclient.NumpyClient(testurl) | ||||||
|  |  | ||||||
|  |         client.stream_create("/context/test", "uint16_1") | ||||||
|  |         with client.stream_insert_numpy_context("/context/test") as ctx: | ||||||
|  |             # override _max_rows to trigger frequent server updates | ||||||
|  |             ctx._max_rows = 2 | ||||||
|  |             ctx.insert([[1000, 1]]) | ||||||
|  |             ctx.insert([[1010, 1], [1020, 1], [1030, 1]]) | ||||||
|  |             ctx.insert([[1040, 1], [1050, 1]]) | ||||||
|  |             ctx.finalize() | ||||||
|  |             ctx.insert([[1070, 1]]) | ||||||
|  |             ctx.update_end(1080) | ||||||
|  |             ctx.finalize() | ||||||
|  |             ctx.update_start(1090) | ||||||
|  |             ctx.insert([[1100, 1]]) | ||||||
|  |             ctx.insert([[1110, 1]]) | ||||||
|  |             ctx.send() | ||||||
|  |             ctx.insert([[1120, 1], [1130, 1], [1140, 1]]) | ||||||
|  |             ctx.update_end(1160) | ||||||
|  |             ctx.insert([[1150, 1]]) | ||||||
|  |             ctx.update_end(1170) | ||||||
|  |             ctx.insert([[1160, 1]]) | ||||||
|  |             ctx.update_end(1180) | ||||||
|  |             ctx.insert([[1170, 123456789.0]]) | ||||||
|  |             ctx.finalize() | ||||||
|  |             ctx.insert(np.zeros((0,2))) | ||||||
|  |  | ||||||
|  |         with assert_raises(ClientError): | ||||||
|  |             with client.stream_insert_numpy_context("/context/test", | ||||||
|  |                                                     1000, 2000) as ctx: | ||||||
|  |                 ctx.insert([[1180, 1]]) | ||||||
|  |  | ||||||
|  |         with assert_raises(ClientError): | ||||||
|  |             with client.stream_insert_numpy_context("/context/test", | ||||||
|  |                                                     2000, 3000) as ctx: | ||||||
|  |                 ctx._max_rows = 2 | ||||||
|  |                 ctx.insert([[3180, 1]]) | ||||||
|  |                 ctx.insert([[3181, 1]]) | ||||||
|  |  | ||||||
|  |         with client.stream_insert_numpy_context("/context/test", | ||||||
|  |                                                 2000, 3000) as ctx: | ||||||
|  |             # make sure our override wasn't permanent | ||||||
|  |             ne_(ctx._max_rows, 2) | ||||||
|  |             ctx.insert([[2250, 1]]) | ||||||
|  |             ctx.finalize() | ||||||
|  |  | ||||||
|  |         with assert_raises(ClientError): | ||||||
|  |             with client.stream_insert_numpy_context("/context/test", | ||||||
|  |                                                     3000, 4000) as ctx: | ||||||
|  |                 ctx.insert([[3010, 1]]) | ||||||
|  |                 ctx.insert([[3020, 2]]) | ||||||
|  |                 ctx.insert([[3030, 3]]) | ||||||
|  |                 ctx.insert([[3040, 4]]) | ||||||
|  |                 ctx.insert([[3040, 4]]) # non-monotonic after a few lines | ||||||
|  |                 ctx.finalize() | ||||||
|  |  | ||||||
|  |         eq_(list(client.stream_intervals("/context/test")), | ||||||
|  |             [ [ 1000, 1051 ], | ||||||
|  |               [ 1070, 1080 ], | ||||||
|  |               [ 1090, 1180 ], | ||||||
|  |               [ 2000, 3000 ] ]) | ||||||
|  |  | ||||||
|  |         client.stream_remove("/context/test") | ||||||
|  |         client.stream_destroy("/context/test") | ||||||
|  |         client.close() | ||||||
|  |  | ||||||
|  |     def test_numpyclient_05_emptyintervals(self): | ||||||
|  |         # Like test_client_emptyintervals, with insert_numpy_context | ||||||
|  |         client = nilmdb.client.numpyclient.NumpyClient(testurl) | ||||||
|  |         client.stream_create("/empty/test", "uint16_1") | ||||||
|  |         def info(): | ||||||
|  |             result = [] | ||||||
|  |             for interval in list(client.stream_intervals("/empty/test")): | ||||||
|  |                 result.append((client.stream_count("/empty/test", *interval), | ||||||
|  |                                interval)) | ||||||
|  |             return result | ||||||
|  |         eq_(info(), []) | ||||||
|  |  | ||||||
|  |         # Insert a region with just a few points | ||||||
|  |         with client.stream_insert_numpy_context("/empty/test") as ctx: | ||||||
|  |             ctx.update_start(100) | ||||||
|  |             ctx.insert([[140, 1]]) | ||||||
|  |             ctx.insert([[150, 1]]) | ||||||
|  |             ctx.insert([[160, 1]]) | ||||||
|  |             ctx.update_end(200) | ||||||
|  |             ctx.finalize() | ||||||
|  |         eq_(info(), [(3, [100, 200])]) | ||||||
|  |  | ||||||
|  |         # Delete chunk, which will leave one data point and two intervals | ||||||
|  |         client.stream_remove("/empty/test", 145, 175) | ||||||
|  |         eq_(info(), [(1, [100, 145]), | ||||||
|  |                      (0, [175, 200])]) | ||||||
|  |  | ||||||
|  |         # Try also creating a completely empty interval from scratch, | ||||||
|  |         # in a few different ways. | ||||||
|  |         client.stream_insert("/empty/test", "", 300, 350) | ||||||
|  |         client.stream_insert("/empty/test", [], 400, 450) | ||||||
|  |         with client.stream_insert_numpy_context("/empty/test", 500, 550): | ||||||
|  |             pass | ||||||
|  |  | ||||||
|  |         # If enough timestamps aren't provided, empty streams won't be created. | ||||||
|  |         client.stream_insert("/empty/test", []) | ||||||
|  |         with client.stream_insert_numpy_context("/empty/test"): | ||||||
|  |             pass | ||||||
|  |         client.stream_insert("/empty/test", [], start = 600) | ||||||
|  |         with client.stream_insert_numpy_context("/empty/test", start = 700): | ||||||
|  |             pass | ||||||
|  |         client.stream_insert("/empty/test", [], end = 850) | ||||||
|  |         with client.stream_insert_numpy_context("/empty/test", end = 950): | ||||||
|  |             pass | ||||||
|  |  | ||||||
|  |         # Equal start and end is OK as long as there's no data | ||||||
|  |         with assert_raises(ClientError) as e: | ||||||
|  |             with client.stream_insert_numpy_context("/empty/test", | ||||||
|  |                                                     start=9, end=9) as ctx: | ||||||
|  |                 ctx.insert([[9, 9]]) | ||||||
|  |                 ctx.finalize() | ||||||
|  |         in_("have data to send, but invalid start/end times", str(e.exception)) | ||||||
|  |  | ||||||
|  |         with client.stream_insert_numpy_context("/empty/test", | ||||||
|  |                                                 start=9, end=9) as ctx: | ||||||
|  |             pass | ||||||
|  |  | ||||||
|  |         # reusing a context object is bad | ||||||
|  |         with assert_raises(Exception) as e: | ||||||
|  |             ctx.insert([[9, 9]]) | ||||||
|  |  | ||||||
|  |         # Try various things that might cause problems | ||||||
|  |         with client.stream_insert_numpy_context("/empty/test", | ||||||
|  |                                                 1000, 1050) as ctx: | ||||||
|  |             ctx.finalize() # inserts [1000, 1050] | ||||||
|  |             ctx.finalize() # nothing | ||||||
|  |             ctx.finalize() # nothing | ||||||
|  |             ctx.insert([[1100, 1]]) | ||||||
|  |             ctx.finalize() # inserts [1100, 1101] | ||||||
|  |             ctx.update_start(1199) | ||||||
|  |             ctx.insert([[1200, 1]]) | ||||||
|  |             ctx.update_end(1250) | ||||||
|  |             ctx.finalize() # inserts [1199, 1250] | ||||||
|  |             ctx.update_start(1299) | ||||||
|  |             ctx.finalize() # nothing | ||||||
|  |             ctx.update_end(1350) | ||||||
|  |             ctx.finalize() # nothing | ||||||
|  |             ctx.update_start(1400) | ||||||
|  |             ctx.insert(np.zeros((0,2))) | ||||||
|  |             ctx.update_end(1450) | ||||||
|  |             ctx.finalize() | ||||||
|  |             ctx.update_start(1500) | ||||||
|  |             ctx.insert(np.zeros((0,2))) | ||||||
|  |             ctx.update_end(1550) | ||||||
|  |             ctx.finalize() | ||||||
|  |             ctx.insert(np.zeros((0,2))) | ||||||
|  |             ctx.insert(np.zeros((0,2))) | ||||||
|  |             ctx.insert(np.zeros((0,2))) | ||||||
|  |             ctx.finalize() | ||||||
|  |  | ||||||
|  |         # Check everything | ||||||
|  |         eq_(info(), [(1, [100, 145]), | ||||||
|  |                      (0, [175, 200]), | ||||||
|  |                      (0, [300, 350]), | ||||||
|  |                      (0, [400, 450]), | ||||||
|  |                      (0, [500, 550]), | ||||||
|  |                      (0, [1000, 1050]), | ||||||
|  |                      (1, [1100, 1101]), | ||||||
|  |                      (1, [1199, 1250]), | ||||||
|  |                      (0, [1400, 1450]), | ||||||
|  |                      (0, [1500, 1550]), | ||||||
|  |                      ]) | ||||||
|  |  | ||||||
|  |         # Clean up | ||||||
|  |         client.stream_remove("/empty/test") | ||||||
|  |         client.stream_destroy("/empty/test") | ||||||
|  |         client.close() | ||||||
| @@ -18,7 +18,7 @@ class TestPrintf(object): | |||||||
|             printf("hello, world: %d", 123) |             printf("hello, world: %d", 123) | ||||||
|             fprintf(test2, "hello too: %d", 123) |             fprintf(test2, "hello too: %d", 123) | ||||||
|             test3 = sprintf("hello three: %d", 123) |             test3 = sprintf("hello three: %d", 123) | ||||||
|         except: |         except Exception: | ||||||
|             sys.stdout = old_stdout |             sys.stdout = old_stdout | ||||||
|             raise |             raise | ||||||
|         sys.stdout = old_stdout |         sys.stdout = old_stdout | ||||||
|   | |||||||
| @@ -62,6 +62,28 @@ class Base(object): | |||||||
|         eq_(self.foo.val, 20) |         eq_(self.foo.val, 20) | ||||||
|         eq_(self.foo.init_thread, self.foo.test_thread) |         eq_(self.foo.init_thread, self.foo.test_thread) | ||||||
|  |  | ||||||
|  | class ListLike(object): | ||||||
|  |     def __init__(self): | ||||||
|  |         self.thread = threading.current_thread().name | ||||||
|  |         self.foo = 0 | ||||||
|  |  | ||||||
|  |     def __iter__(self): | ||||||
|  |         eq_(threading.current_thread().name, self.thread) | ||||||
|  |         self.foo = 0 | ||||||
|  |         return self | ||||||
|  |  | ||||||
|  |     def __getitem__(self, key): | ||||||
|  |         eq_(threading.current_thread().name, self.thread) | ||||||
|  |         return key | ||||||
|  |  | ||||||
|  |     def next(self): | ||||||
|  |         eq_(threading.current_thread().name, self.thread) | ||||||
|  |         if self.foo < 5: | ||||||
|  |             self.foo += 1 | ||||||
|  |             return self.foo | ||||||
|  |         else: | ||||||
|  |             raise StopIteration | ||||||
|  |  | ||||||
| class TestUnserialized(Base): | class TestUnserialized(Base): | ||||||
|     def setUp(self): |     def setUp(self): | ||||||
|         self.foo = Foo() |         self.foo = Foo() | ||||||
| @@ -84,3 +106,9 @@ class TestSerializer(Base): | |||||||
|         sp(sp(Foo("x"))).t() |         sp(sp(Foo("x"))).t() | ||||||
|         sp(sp(Foo)("x")).t() |         sp(sp(Foo)("x")).t() | ||||||
|         sp(sp(Foo))("x").t() |         sp(sp(Foo))("x").t() | ||||||
|  |  | ||||||
|  |     def test_iter(self): | ||||||
|  |         sp = nilmdb.utils.serializer_proxy | ||||||
|  |         i = sp(ListLike)() | ||||||
|  |         eq_(list(i), [1,2,3,4,5]) | ||||||
|  |         eq_(i[3], 3) | ||||||
|   | |||||||
| @@ -1,419 +0,0 @@ | |||||||
|  |  | ||||||
| #----------------------------------------------- |  | ||||||
| #aplotter.py - ascii art function plotter |  | ||||||
| #Copyright (c) 2006, Imri Goldberg |  | ||||||
| #All rights reserved. |  | ||||||
| # |  | ||||||
| #Redistribution and use in source and binary forms, |  | ||||||
| #with or without modification, are permitted provided |  | ||||||
| #that the following conditions are met: |  | ||||||
| # |  | ||||||
| #    * Redistributions of source code must retain the |  | ||||||
| #		above copyright notice, this list of conditions |  | ||||||
| #		and the following disclaimer. |  | ||||||
| #    * Redistributions in binary form must reproduce the |  | ||||||
| #		above copyright notice, this list of conditions |  | ||||||
| #		and the following disclaimer in the documentation |  | ||||||
| #		and/or other materials provided with the distribution. |  | ||||||
| #    * Neither the name of the <ORGANIZATION> nor the names of |  | ||||||
| #		its contributors may be used to endorse or promote products |  | ||||||
| #		derived from this software without specific prior written permission. |  | ||||||
| # |  | ||||||
| #THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" |  | ||||||
| #AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |  | ||||||
| #IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |  | ||||||
| #ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE |  | ||||||
| #LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL |  | ||||||
| #DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR |  | ||||||
| #SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER |  | ||||||
| #CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, |  | ||||||
| #OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |  | ||||||
| #OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
| #----------------------------------------------- |  | ||||||
|  |  | ||||||
| import math |  | ||||||
|  |  | ||||||
|  |  | ||||||
| EPSILON = 0.000001 |  | ||||||
|  |  | ||||||
| def transposed(mat): |  | ||||||
| 	result = [] |  | ||||||
| 	for i in xrange(len(mat[0])): |  | ||||||
| 		result.append([x[i] for x in mat]) |  | ||||||
| 	return result |  | ||||||
|  |  | ||||||
| def y_reversed(mat):     |  | ||||||
| 	result = [] |  | ||||||
| 	for i in range(len(mat)): |  | ||||||
| 		result.append(list(reversed(mat[i]))) |  | ||||||
| 	return result |  | ||||||
|  |  | ||||||
| def sign(x): |  | ||||||
| 	if 0<x: |  | ||||||
| 		return 1 |  | ||||||
| 	if 0 == x: |  | ||||||
| 		return 0 |  | ||||||
| 	return -1 |  | ||||||
|  |  | ||||||
| class Plotter(object): |  | ||||||
|  |  | ||||||
| 	class PlotData(object): |  | ||||||
| 		def __init__(self, x_size, y_size, min_x, max_x, min_y, max_y, x_mod, y_mod): |  | ||||||
| 			self.x_size = x_size |  | ||||||
| 			self.y_size = y_size |  | ||||||
| 			self.min_x = min_x |  | ||||||
| 			self.max_x = max_x |  | ||||||
| 			self.min_y = min_y |  | ||||||
| 			self.max_y = max_y |  | ||||||
| 			self.x_mod = x_mod |  | ||||||
| 			self.y_mod = y_mod |  | ||||||
|  |  | ||||||
| 			self.x_step = float(max_x - min_x)/float(self.x_size) |  | ||||||
| 			self.y_step = float(max_y - min_y)/float(self.y_size) |  | ||||||
| 			self.inv_x_step = 1/self.x_step |  | ||||||
| 			self.inv_y_step = 1/self.y_step |  | ||||||
|  |  | ||||||
| 			self.ratio = self.y_step / self.x_step |  | ||||||
| 		def __repr__(self): |  | ||||||
| 			s = "size: %s, bl: %s, tr: %s, step: %s" % ((self.x_size, self.y_size), (self.min_x, self.min_y), (self.max_x, self.max_y), |  | ||||||
| 														 (self.x_step, self.y_step)) |  | ||||||
| 			return s |  | ||||||
| 	 |  | ||||||
| 	def __init__(self, **kwargs): |  | ||||||
|  |  | ||||||
| 		self.x_size = kwargs.get("x_size", 80) |  | ||||||
| 		self.y_size = kwargs.get("y_size", 20) |  | ||||||
|  |  | ||||||
| 		self.will_draw_axes = kwargs.get("draw_axes", True) |  | ||||||
|  |  | ||||||
| 		self.new_line = kwargs.get("newline", "\n") |  | ||||||
|  |  | ||||||
| 		self.dot = kwargs.get("dot", "*") |  | ||||||
|  |  | ||||||
| 		self.plot_slope = kwargs.get("plot_slope", True) |  | ||||||
|  |  | ||||||
| 		self.x_margin = kwargs.get("x_margin", 0.05) |  | ||||||
| 		self.y_margin = kwargs.get("y_margin", 0.1) |  | ||||||
|  |  | ||||||
| 		self.will_plot_labels = kwargs.get("plot_labels", True) |  | ||||||
|  |  | ||||||
| 	@staticmethod |  | ||||||
| 	def get_symbol_by_slope(slope, default_symbol): |  | ||||||
| 		draw_symbol = default_symbol |  | ||||||
| 		if slope > math.tan(3*math.pi/8): |  | ||||||
| 			draw_symbol = "|" |  | ||||||
| 		elif slope > math.tan(math.pi/8) and slope < math.tan(3*math.pi/8): |  | ||||||
| 			draw_symbol = "/" |  | ||||||
| 		elif abs(slope) < math.tan(math.pi/8): |  | ||||||
| 			draw_symbol = "-" |  | ||||||
| 		elif slope < math.tan(-math.pi/8) and slope > math.tan(-3*math.pi/8): |  | ||||||
| 			draw_symbol = "\\" |  | ||||||
| 		elif slope < math.tan(-3*math.pi/8): |  | ||||||
| 			draw_symbol = "|" |  | ||||||
| 		return draw_symbol     |  | ||||||
|  |  | ||||||
|  |  | ||||||
| 	def plot_labels(self, output_buffer, plot_data): |  | ||||||
| 		if plot_data.y_size < 2: |  | ||||||
| 			return |  | ||||||
|  |  | ||||||
| 		margin_factor = 1 |  | ||||||
|  |  | ||||||
| 		do_plot_x_label = True |  | ||||||
| 		do_plot_y_label = True |  | ||||||
|  |  | ||||||
| 		x_str = "%+g" |  | ||||||
| 		if plot_data.x_size < 16: |  | ||||||
| 			do_plot_x_label = False |  | ||||||
| 		elif plot_data.x_size < 23: |  | ||||||
| 			x_str = "%+.2g"  |  | ||||||
|  |  | ||||||
| 		y_str = "%+g"     |  | ||||||
| 		if plot_data.x_size < 8: |  | ||||||
| 			do_plot_y_label = False |  | ||||||
| 		elif plot_data.x_size < 11: |  | ||||||
| 			y_str = "%+.2g" |  | ||||||
| 			 |  | ||||||
| 		act_min_x = (plot_data.min_x + plot_data.x_mod*margin_factor) |  | ||||||
| 		act_max_x = (plot_data.max_x - plot_data.x_mod*margin_factor) |  | ||||||
| 		act_min_y = (plot_data.min_y + plot_data.y_mod*margin_factor) |  | ||||||
| 		act_max_y = (plot_data.max_y - plot_data.y_mod*margin_factor) |  | ||||||
|  |  | ||||||
| 		if abs(act_min_x) < 1: |  | ||||||
| 			min_x_str = "%+.2g" % act_min_x |  | ||||||
| 		else: |  | ||||||
| 			min_x_str = x_str % act_min_x |  | ||||||
|  |  | ||||||
| 		if abs(act_max_x) < 1: |  | ||||||
| 			max_x_str = "%+.2g" % act_max_x |  | ||||||
| 		else: |  | ||||||
| 			max_x_str = x_str % act_max_x |  | ||||||
| 		 |  | ||||||
| 		if abs(act_min_y) < 1: |  | ||||||
| 			min_y_str = "%+.2g" % act_min_y |  | ||||||
| 		else: |  | ||||||
| 			min_y_str = y_str % act_min_y |  | ||||||
|  |  | ||||||
| 		if abs(act_max_y) < 1: |  | ||||||
| 			max_y_str = "%+.2g" % act_max_y |  | ||||||
| 		else: |  | ||||||
| 			max_y_str = y_str % act_max_y |  | ||||||
| 						  |  | ||||||
| 		min_x_coord = self.get_coord(act_min_x,plot_data.min_x,plot_data.x_step) |  | ||||||
| 		max_x_coord = self.get_coord(act_max_x,plot_data.min_x,plot_data.x_step) |  | ||||||
| 		min_y_coord = self.get_coord(act_min_y,plot_data.min_y,plot_data.y_step) |  | ||||||
| 		max_y_coord = self.get_coord(act_max_y,plot_data.min_y,plot_data.y_step) |  | ||||||
| 								  |  | ||||||
|  |  | ||||||
| 		#print plot_data |  | ||||||
| 		 |  | ||||||
| 		y_zero_coord = self.get_coord(0, plot_data.min_y, plot_data.y_step) |  | ||||||
|  |  | ||||||
| 		#if plot_data.min_x < 0 and plot_data.max_x > 0: |  | ||||||
| 		x_zero_coord = self.get_coord(0, plot_data.min_x, plot_data.x_step) |  | ||||||
| 		#else: |  | ||||||
| 		 |  | ||||||
| 		#pass |  | ||||||
|  |  | ||||||
| 		output_buffer[x_zero_coord][min_y_coord] = "+" |  | ||||||
| 		output_buffer[x_zero_coord][max_y_coord] = "+" |  | ||||||
| 		output_buffer[min_x_coord][y_zero_coord] = "+" |  | ||||||
| 		output_buffer[max_x_coord][y_zero_coord] = "+" |  | ||||||
|  |  | ||||||
| 		if do_plot_x_label:         |  | ||||||
|  |  | ||||||
| 			for i,c in enumerate(min_x_str): |  | ||||||
| 				output_buffer[min_x_coord+i][y_zero_coord-1] = c |  | ||||||
| 			for i,c in enumerate(max_x_str): |  | ||||||
| 				output_buffer[max_x_coord+i-len(max_x_str)][y_zero_coord-1] = c |  | ||||||
|  |  | ||||||
| 		if do_plot_y_label: |  | ||||||
|  |  | ||||||
| 			for i,c in enumerate(max_y_str): |  | ||||||
| 				output_buffer[x_zero_coord+i][max_y_coord] = c |  | ||||||
| 			for i,c in enumerate(min_y_str): |  | ||||||
| 				output_buffer[x_zero_coord+i][min_y_coord] = c |  | ||||||
| 			 |  | ||||||
|  |  | ||||||
| 		 |  | ||||||
| 		 |  | ||||||
| 	 |  | ||||||
| 	def plot_data(self, xy_seq, output_buffer, plot_data): |  | ||||||
| 		if self.plot_slope: |  | ||||||
| 			xy_seq = list(xy_seq) |  | ||||||
| 			#sort according to the x coord |  | ||||||
| 			xy_seq.sort(key = lambda c: c[0]) |  | ||||||
| 			prev_p = xy_seq[0] |  | ||||||
| 			e_xy_seq = enumerate(xy_seq) |  | ||||||
| 			e_xy_seq.next() |  | ||||||
| 			for i,(x,y) in e_xy_seq: |  | ||||||
| 				draw_symbol = self.dot |  | ||||||
| 				line_drawn = self.plot_line(prev_p, (x,y), output_buffer, plot_data) |  | ||||||
| 				prev_p = (x,y) |  | ||||||
| 				if not line_drawn: |  | ||||||
| 					if i > 0 and i < len(xy_seq)-1: |  | ||||||
| 						px,py = xy_seq[i-1] |  | ||||||
| 						nx,ny = xy_seq[i+1] |  | ||||||
|  |  | ||||||
| 						if abs(nx-px) > EPSILON: |  | ||||||
| 							slope = (1.0/plot_data.ratio)*(ny-py)/(nx-px) |  | ||||||
| 							draw_symbol = self.get_symbol_by_slope(slope, draw_symbol) |  | ||||||
| 					if x < plot_data.min_x or x >= plot_data.max_x or y < plot_data.min_y or y >= plot_data.max_y: |  | ||||||
| 						continue |  | ||||||
| 					 |  | ||||||
| 					x_coord = self.get_coord(x, plot_data.min_x, plot_data.x_step) |  | ||||||
| 					y_coord = self.get_coord(y, plot_data.min_y, plot_data.y_step)             |  | ||||||
| 					if x_coord >= 0 and x_coord < len(output_buffer) and y_coord >= 0 and y_coord < len(output_buffer[0]): |  | ||||||
| 						if self.draw_axes: |  | ||||||
| 							if y_coord == self.get_coord(0, plot_data.min_y, plot_data.y_step) and draw_symbol == "-": |  | ||||||
| 								draw_symbol = "=" |  | ||||||
| 						output_buffer[x_coord][y_coord] = draw_symbol |  | ||||||
| 		else: |  | ||||||
| 			for x,y in xy_seq: |  | ||||||
| 				if x < plot_data.min_x or x >= plot_data.max_x or y < plot_data.min_y or y >= plot_data.max_y: |  | ||||||
| 					continue |  | ||||||
| 				x_coord = self.get_coord(x, plot_data.min_x, plot_data.x_step) |  | ||||||
| 				y_coord = self.get_coord(y, plot_data.min_y, plot_data.y_step) |  | ||||||
| 				if x_coord >= 0 and x_coord < len(output_buffer) and y_coord > 0 and y_coord < len(output_buffer[0]): |  | ||||||
| 					output_buffer[x_coord][y_coord] = self.dot |  | ||||||
|  |  | ||||||
|  |  | ||||||
| 	def plot_line(self, start, end, output_buffer, plot_data): |  | ||||||
|  |  | ||||||
| 		start_coord = self.get_coord(start[0], plot_data.min_x, plot_data.x_step), self.get_coord(start[1], plot_data.min_y, plot_data.y_step) |  | ||||||
| 		end_coord = self.get_coord(end[0], plot_data.min_x, plot_data.x_step), self.get_coord(end[1], plot_data.min_y, plot_data.y_step) |  | ||||||
|  |  | ||||||
| 		x0,y0 = start_coord |  | ||||||
| 		x1,y1 = end_coord |  | ||||||
| 		if (x0,y0) == (x1,y1): |  | ||||||
| 			return True     |  | ||||||
| 		 |  | ||||||
| 		clipped_line = clip_line(start, end, (plot_data.min_x, plot_data.min_y), (plot_data.max_x, plot_data.max_y)) |  | ||||||
| 		if clipped_line != None: |  | ||||||
| 			start,end = clipped_line |  | ||||||
| 		else: |  | ||||||
| 			return False |  | ||||||
| 		start_coord = self.get_coord(start[0], plot_data.min_x, plot_data.x_step), self.get_coord(start[1], plot_data.min_y, plot_data.y_step) |  | ||||||
| 		end_coord = self.get_coord(end[0], plot_data.min_x, plot_data.x_step), self.get_coord(end[1], plot_data.min_y, plot_data.y_step) |  | ||||||
|  |  | ||||||
| 		x0,y0 = start_coord |  | ||||||
| 		x1,y1 = end_coord |  | ||||||
| 		if (x0,y0) == (x1,y1): |  | ||||||
| 			return True |  | ||||||
| 		x_zero_coord = self.get_coord(0, plot_data.min_x, plot_data.x_step) |  | ||||||
| 		y_zero_coord = self.get_coord(0, plot_data.min_y, plot_data.y_step)    |  | ||||||
|  |  | ||||||
| 		if start[0]-end[0] == 0: |  | ||||||
| 			draw_symbol = "|" |  | ||||||
| 		else: |  | ||||||
| 			slope = (1.0/plot_data.ratio)*(end[1]-start[1])/(end[0]-start[0]) |  | ||||||
| 			draw_symbol = self.get_symbol_by_slope(slope, self.dot) |  | ||||||
| 		try: |  | ||||||
|  |  | ||||||
| 			delta = x1-x0, y1-y0 |  | ||||||
| 			if abs(delta[0])>abs(delta[1]): |  | ||||||
| 				s = sign(delta[0]) |  | ||||||
| 				slope = float(delta[1])/delta[0] |  | ||||||
| 				for i in range(0,abs(int(delta[0]))): |  | ||||||
| 					cur_draw_symbol = draw_symbol |  | ||||||
| 					x = i*s |  | ||||||
| 					cur_y = int(y0+slope*x) |  | ||||||
| 					if self.draw_axes and cur_y == y_zero_coord and draw_symbol == "-": |  | ||||||
| 						cur_draw_symbol = "=" |  | ||||||
| 					output_buffer[x0+x][cur_y] = cur_draw_symbol |  | ||||||
| 				 |  | ||||||
| 				 |  | ||||||
| 			else: |  | ||||||
| 				s = sign(delta[1]) |  | ||||||
| 				slope = float(delta[0])/delta[1] |  | ||||||
| 				for i in range(0,abs(int(delta[1]))): |  | ||||||
| 					y = i*s |  | ||||||
| 					cur_draw_symbol = draw_symbol |  | ||||||
| 					cur_y = y0+y |  | ||||||
| 					if self.draw_axes and cur_y == y_zero_coord and draw_symbol == "-": |  | ||||||
| 						cur_draw_symbol = "=" |  | ||||||
| 					output_buffer[int(x0+slope*y)][cur_y] = cur_draw_symbol |  | ||||||
| 		except: |  | ||||||
| 			print start, end |  | ||||||
| 			print start_coord, end_coord |  | ||||||
| 			print plot_data |  | ||||||
| 			raise |  | ||||||
|  |  | ||||||
| 		return False             |  | ||||||
| 		 |  | ||||||
| 		 |  | ||||||
| 	def plot_single(self, seq, min_x = None, max_x = None, min_y = None, max_y = None): |  | ||||||
| 		return self.plot_double(range(len(seq)),seq, min_x, max_x, min_y, max_y) |  | ||||||
| 		 |  | ||||||
|  |  | ||||||
|  |  | ||||||
|  |  | ||||||
| 	def plot_double(self, x_seq, y_seq, min_x = None, max_x = None, min_y = None, max_y = None): |  | ||||||
| 		if min_x == None: |  | ||||||
| 			min_x = min(x_seq) |  | ||||||
| 		if max_x == None: |  | ||||||
| 			max_x = max(x_seq) |  | ||||||
| 		if min_y == None: |  | ||||||
| 			min_y = min(y_seq) |  | ||||||
| 		if max_y == None: |  | ||||||
| 			max_y = max(y_seq) |  | ||||||
|  |  | ||||||
| 		if max_y == min_y: |  | ||||||
| 			max_y += 1 |  | ||||||
|  |  | ||||||
| 		x_mod = (max_x-min_x)*self.x_margin |  | ||||||
| 		y_mod = (max_y-min_y)*self.y_margin |  | ||||||
| 		min_x-=x_mod |  | ||||||
| 		max_x+=x_mod |  | ||||||
| 		min_y-=y_mod |  | ||||||
| 		max_y+=y_mod |  | ||||||
|  |  | ||||||
|  |  | ||||||
| 		plot_data = self.PlotData(self.x_size, self.y_size, min_x, max_x, min_y, max_y, x_mod, y_mod) |  | ||||||
|  |  | ||||||
| 		output_buffer = [[" "]*self.y_size for i in range(self.x_size)] |  | ||||||
|  |  | ||||||
| 		if self.will_draw_axes: |  | ||||||
| 			self.draw_axes(output_buffer, plot_data) |  | ||||||
|  |  | ||||||
| 		self.plot_data(zip(x_seq, y_seq), output_buffer, plot_data) |  | ||||||
|  |  | ||||||
| 		if self.will_plot_labels: |  | ||||||
| 			self.plot_labels(output_buffer, plot_data) |  | ||||||
|  |  | ||||||
| 		trans_result = transposed(y_reversed(output_buffer)) |  | ||||||
|  |  | ||||||
| 		result = self.new_line.join(["".join(row) for row in trans_result]) |  | ||||||
| 		return result |  | ||||||
|  |  | ||||||
| 	def draw_axes(self, output_buffer, plot_data): |  | ||||||
| 		 |  | ||||||
| 		 |  | ||||||
| 		draw_x = False |  | ||||||
| 		draw_y = False |  | ||||||
|  |  | ||||||
| 		if plot_data.min_x <= 0 and plot_data.max_x > 0: |  | ||||||
| 			draw_y = True |  | ||||||
| 			zero_x = self.get_coord(0, plot_data.min_x, plot_data.x_step) |  | ||||||
| 			for y in xrange(plot_data.y_size): |  | ||||||
| 				output_buffer[zero_x][y] = "|" |  | ||||||
| 				 |  | ||||||
| 		if plot_data.min_y <= 0 and plot_data.max_y > 0: |  | ||||||
| 			draw_x = True |  | ||||||
| 			zero_y = self.get_coord(0, plot_data.min_y, plot_data.y_step)     |  | ||||||
| 			for x in xrange(plot_data.x_size): |  | ||||||
| 				output_buffer[x][zero_y] = "-" |  | ||||||
|  |  | ||||||
| 		if draw_x and draw_y: |  | ||||||
| 			output_buffer[zero_x][zero_y] = "+" |  | ||||||
| 		 |  | ||||||
| 		 |  | ||||||
| 	@staticmethod |  | ||||||
| 	def get_coord(val, min, step): |  | ||||||
| 		result = int((val - min)/step) |  | ||||||
| 		return result |  | ||||||
|  |  | ||||||
| def clip_line(line_pt_1, line_pt_2, rect_bottom_left, rect_top_right): |  | ||||||
| 	ts = [0.0,1.0] |  | ||||||
| 	if line_pt_1[0] == line_pt_2[0]: |  | ||||||
| 		return ((line_pt_1[0], max(min(line_pt_1[1], line_pt_2[1]), rect_bottom_left[1])), |  | ||||||
| 				(line_pt_1[0], min(max(line_pt_1[1], line_pt_2[1]), rect_top_right[1]))) |  | ||||||
| 	if line_pt_1[1] == line_pt_2[1]: |  | ||||||
| 		return ((max(min(line_pt_1[0], line_pt_2[0]), rect_bottom_left[0]), line_pt_1[1]), |  | ||||||
| 				(min(max(line_pt_1[0], line_pt_2[0]), rect_top_right[0]), line_pt_1[1])) |  | ||||||
|  |  | ||||||
| 	if ((rect_bottom_left[0] <= line_pt_1[0] and line_pt_1[0] < rect_top_right[0]) and |  | ||||||
| 		(rect_bottom_left[1] <= line_pt_1[1] and line_pt_1[1] < rect_top_right[1]) and |  | ||||||
| 		(rect_bottom_left[0] <= line_pt_2[0] and line_pt_2[0] < rect_top_right[0]) and |  | ||||||
| 		(rect_bottom_left[1] <= line_pt_2[1] and line_pt_2[1] < rect_top_right[1])): |  | ||||||
| 		return line_pt_1, line_pt_2 |  | ||||||
|  |  | ||||||
| 	ts.append( float(rect_bottom_left[0]-line_pt_1[0])/(line_pt_2[0]-line_pt_1[0]) ) |  | ||||||
| 	ts.append( float(rect_top_right[0]-line_pt_1[0])/(line_pt_2[0]-line_pt_1[0]) ) |  | ||||||
| 	ts.append( float(rect_bottom_left[1]-line_pt_1[1])/(line_pt_2[1]-line_pt_1[1]) ) |  | ||||||
| 	ts.append( float(rect_top_right[1]-line_pt_1[1])/(line_pt_2[1]-line_pt_1[1]) ) |  | ||||||
| 	 |  | ||||||
| 	ts.sort() |  | ||||||
| 	if ts[2] < 0 or ts[2] >= 1 or ts[3] < 0 or ts[2]>= 1: |  | ||||||
| 		return None |  | ||||||
| 	result = [(pt_1 + t*(pt_2-pt_1)) for t in (ts[2],ts[3]) for (pt_1, pt_2) in zip(line_pt_1, line_pt_2)] |  | ||||||
| 	return (result[0],result[1]), (result[2], result[3]) |  | ||||||
| 	 |  | ||||||
|  |  | ||||||
|  |  | ||||||
| def plot(*args,**flags): |  | ||||||
| 	limit_flags_names = set(["min_x","min_y","max_x","max_y"]) |  | ||||||
| 	limit_flags = dict([(n,flags[n]) for n in limit_flags_names & set(flags)]) |  | ||||||
| 	settting_flags = dict([(n,flags[n]) for n in set(flags) - limit_flags_names]) |  | ||||||
| 	 |  | ||||||
| 	if len(args) == 1: |  | ||||||
| 		p = Plotter(**settting_flags) |  | ||||||
| 		print p.plot_single(args[0],**limit_flags) |  | ||||||
| 	elif len(args) == 2: |  | ||||||
| 		p = Plotter(**settting_flags) |  | ||||||
| 		print p.plot_double(args[0],args[1],**limit_flags) |  | ||||||
| 	else: |  | ||||||
| 		raise NotImplementedError("can't draw multiple graphs yet") |  | ||||||
| 	 |  | ||||||
| __all__ = ["Plotter","plot"] |  | ||||||
|  |  | ||||||
		Reference in New Issue
	
	Block a user