WIP db
This commit is contained in:
		
							parent
							
								
									d7800f6337
								
							
						
					
					
						commit
						790f29d4ba
					
				
							
								
								
									
										8
									
								
								docs/running.md
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										8
									
								
								docs/running.md
									
									
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,8 @@ | ||||||
|  | # How to Run the Transit Relay | ||||||
|  | 
 | ||||||
|  | ``` | ||||||
|  | pip install magic-wormhole-transit-relay | ||||||
|  | twist wormhole-transit-relay --port tcp:4001 | ||||||
|  | ``` | ||||||
|  | 
 | ||||||
|  | The relay runs as a twist/twistd plugin. To | ||||||
							
								
								
									
										126
									
								
								src/wormhole_transit_relay/database.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										126
									
								
								src/wormhole_transit_relay/database.py
									
									
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,126 @@ | ||||||
|  | from __future__ import unicode_literals | ||||||
|  | import os | ||||||
|  | import sqlite3 | ||||||
|  | import tempfile | ||||||
|  | from pkg_resources import resource_string | ||||||
|  | from twisted.python import log | ||||||
|  | 
 | ||||||
|  | class DBError(Exception): | ||||||
|  |     pass | ||||||
|  | 
 | ||||||
|  | def get_schema(version): | ||||||
|  |     schema_bytes = resource_string("wormhole.server", | ||||||
|  |                                    "db-schemas/v%d.sql" % version) | ||||||
|  |     return schema_bytes.decode("utf-8") | ||||||
|  | 
 | ||||||
|  | def get_upgrader(new_version): | ||||||
|  |     schema_bytes = resource_string("wormhole.server", | ||||||
|  |                                    "db-schemas/upgrade-to-v%d.sql" % new_version) | ||||||
|  |     return schema_bytes.decode("utf-8") | ||||||
|  | 
 | ||||||
|  | TARGET_VERSION = 3 | ||||||
|  | 
 | ||||||
|  | def dict_factory(cursor, row): | ||||||
|  |     d = {} | ||||||
|  |     for idx, col in enumerate(cursor.description): | ||||||
|  |         d[col[0]] = row[idx] | ||||||
|  |     return d | ||||||
|  | 
 | ||||||
|  | def _initialize_db_schema(db, target_version): | ||||||
|  |     """Creates the application schema in the given database. | ||||||
|  |     """ | ||||||
|  |     log.msg("populating new database with schema v%s" % target_version) | ||||||
|  |     schema = get_schema(target_version) | ||||||
|  |     db.executescript(schema) | ||||||
|  |     db.execute("INSERT INTO version (version) VALUES (?)", | ||||||
|  |                (target_version,)) | ||||||
|  |     db.commit() | ||||||
|  | 
 | ||||||
|  | def _initialize_db_connection(db): | ||||||
|  |     """Sets up the db connection object with a row factory and with necessary | ||||||
|  |     foreign key settings. | ||||||
|  |     """ | ||||||
|  |     db.row_factory = dict_factory | ||||||
|  |     db.execute("PRAGMA foreign_keys = ON") | ||||||
|  |     problems = db.execute("PRAGMA foreign_key_check").fetchall() | ||||||
|  |     if problems: | ||||||
|  |         raise DBError("failed foreign key check: %s" % (problems,)) | ||||||
|  | 
 | ||||||
|  | def _open_db_connection(dbfile): | ||||||
|  |     """Open a new connection to the SQLite3 database at the given path. | ||||||
|  |     """ | ||||||
|  |     try: | ||||||
|  |         db = sqlite3.connect(dbfile) | ||||||
|  |     except (EnvironmentError, sqlite3.OperationalError) as e: | ||||||
|  |         raise DBError("Unable to create/open db file %s: %s" % (dbfile, e)) | ||||||
|  |     _initialize_db_connection(db) | ||||||
|  |     return db | ||||||
|  | 
 | ||||||
|  | def _get_temporary_dbfile(dbfile): | ||||||
|  |     """Get a temporary filename near the given path. | ||||||
|  |     """ | ||||||
|  |     fd, name = tempfile.mkstemp( | ||||||
|  |         prefix=os.path.basename(dbfile) + ".", | ||||||
|  |         dir=os.path.dirname(dbfile) | ||||||
|  |     ) | ||||||
|  |     os.close(fd) | ||||||
|  |     return name | ||||||
|  | 
 | ||||||
|  | def _atomic_create_and_initialize_db(dbfile, target_version): | ||||||
|  |     """Create and return a new database, initialized with the application | ||||||
|  |     schema. | ||||||
|  | 
 | ||||||
|  |     If anything goes wrong, nothing is left at the ``dbfile`` path. | ||||||
|  |     """ | ||||||
|  |     temp_dbfile = _get_temporary_dbfile(dbfile) | ||||||
|  |     db = _open_db_connection(temp_dbfile) | ||||||
|  |     _initialize_db_schema(db, target_version) | ||||||
|  |     db.close() | ||||||
|  |     os.rename(temp_dbfile, dbfile) | ||||||
|  |     return _open_db_connection(dbfile) | ||||||
|  | 
 | ||||||
|  | def get_db(dbfile, target_version=TARGET_VERSION): | ||||||
|  |     """Open or create the given db file. The parent directory must exist. | ||||||
|  |     Returns the db connection object, or raises DBError. | ||||||
|  |     """ | ||||||
|  |     if dbfile == ":memory:": | ||||||
|  |         db = _open_db_connection(dbfile) | ||||||
|  |         _initialize_db_schema(db, target_version) | ||||||
|  |     elif os.path.exists(dbfile): | ||||||
|  |         db = _open_db_connection(dbfile) | ||||||
|  |     else: | ||||||
|  |         db = _atomic_create_and_initialize_db(dbfile, target_version) | ||||||
|  | 
 | ||||||
|  |     try: | ||||||
|  |         version = db.execute("SELECT version FROM version").fetchone()["version"] | ||||||
|  |     except sqlite3.DatabaseError as e: | ||||||
|  |         # this indicates that the file is not a compatible database format. | ||||||
|  |         # Perhaps it was created with an old version, or it might be junk. | ||||||
|  |         raise DBError("db file is unusable: %s" % e) | ||||||
|  | 
 | ||||||
|  |     while version < target_version: | ||||||
|  |         log.msg(" need to upgrade from %s to %s" % (version, target_version)) | ||||||
|  |         try: | ||||||
|  |             upgrader = get_upgrader(version+1) | ||||||
|  |         except ValueError: # ResourceError?? | ||||||
|  |             log.msg(" unable to upgrade %s to %s" % (version, version+1)) | ||||||
|  |             raise DBError("Unable to upgrade %s to version %s, left at %s" | ||||||
|  |                           % (dbfile, version+1, version)) | ||||||
|  |         log.msg(" executing upgrader v%s->v%s" % (version, version+1)) | ||||||
|  |         db.executescript(upgrader) | ||||||
|  |         db.commit() | ||||||
|  |         version = version+1 | ||||||
|  | 
 | ||||||
|  |     if version != target_version: | ||||||
|  |         raise DBError("Unable to handle db version %s" % version) | ||||||
|  | 
 | ||||||
|  |     return db | ||||||
|  | 
 | ||||||
|  | def dump_db(db): | ||||||
|  |     # to let _iterdump work, we need to restore the original row factory | ||||||
|  |     orig = db.row_factory | ||||||
|  |     try: | ||||||
|  |         db.row_factory = sqlite3.Row | ||||||
|  |         return "".join(db.iterdump()) | ||||||
|  |     finally: | ||||||
|  |         db.row_factory = orig | ||||||
							
								
								
									
										30
									
								
								src/wormhole_transit_relay/db-schemas/v1.sql
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										30
									
								
								src/wormhole_transit_relay/db-schemas/v1.sql
									
									
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,30 @@ | ||||||
|  | 
 | ||||||
|  | CREATE TABLE `version` -- contains one row | ||||||
|  | ( | ||||||
|  |  `version` INTEGER -- set to 1 | ||||||
|  | ); | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
|  | CREATE TABLE `current` -- contains one row | ||||||
|  | ( | ||||||
|  |  `reboot` INTEGER, -- seconds since epoch of most recent reboot | ||||||
|  |  `last_update` INTEGER, -- when `current` was last updated | ||||||
|  |  `connected` INTEGER, -- number of current paired connections | ||||||
|  |  `waiting` INTEGER, -- number of not-yet-paired connections | ||||||
|  |  `incomplete_bytes` INTEGER -- bytes sent through not-yet-complete connections | ||||||
|  | ); | ||||||
|  | 
 | ||||||
|  | CREATE TABLE `usage` | ||||||
|  | ( | ||||||
|  |  `started` INTEGER, -- seconds since epoch, rounded to "blur time" | ||||||
|  |  `total_time` INTEGER, -- seconds from open to last close | ||||||
|  |  `waiting_time` INTEGER, -- seconds from start to 2nd side appearing, or None | ||||||
|  |  `total_bytes` INTEGER, -- total bytes relayed (both directions) | ||||||
|  |  `result` VARCHAR -- happy, scary, lonely, errory, pruney | ||||||
|  |  -- transit moods: | ||||||
|  |  --  "errory": one side gave the wrong handshake | ||||||
|  |  --  "lonely": good handshake, but the other side never showed up | ||||||
|  |  --  "happy": both sides gave correct handshake | ||||||
|  | ); | ||||||
|  | CREATE INDEX `transit_usage_idx` ON `transit_usage` (`started`); | ||||||
|  | CREATE INDEX `transit_usage_result_idx` ON `transit_usage` (`result`); | ||||||
|  | @ -9,10 +9,10 @@ This plugin sets up a 'Transit Relay' server for magic-wormhole. This service | ||||||
| listens for TCP connections, finds pairs which present the same handshake, and | listens for TCP connections, finds pairs which present the same handshake, and | ||||||
| glues the two TCP sockets together. | glues the two TCP sockets together. | ||||||
| 
 | 
 | ||||||
| If --usage-logfile= is provided, a line will be written to the given file after | If --log-stdout is provided, a line will be written to stdout after each | ||||||
| each connection is done. This line will be a complete JSON object (starting | connection is done. This line will be a complete JSON object (starting with | ||||||
| with "{", ending with "}\n", and containing no internal newlines). The keys | "{", ending with "}\n", and containing no internal newlines). The keys will | ||||||
| will be: | be: | ||||||
| 
 | 
 | ||||||
| * 'started': number, seconds since epoch | * 'started': number, seconds since epoch | ||||||
| * 'total_time': number, seconds from open to last close | * 'total_time': number, seconds from open to last close | ||||||
|  | @ -27,35 +27,62 @@ second matching side never appeared (and thus 'waiting_time' will be null). | ||||||
| If --blur-usage= is provided, then 'started' will be rounded to the given time | If --blur-usage= is provided, then 'started' will be rounded to the given time | ||||||
| interval, and 'total_bytes' will be rounded as well. | interval, and 'total_bytes' will be rounded as well. | ||||||
| 
 | 
 | ||||||
| If --stats-file is provided, the server will periodically write a simple JSON | If --usage-db= is provided, the server will maintain a SQLite database in the | ||||||
| dictionary to that file (atomically), with cumulative usage data (since last | given file. Current, recent, and historical usage data will be written to the | ||||||
| reboot, and all-time). This information is *not* blurred (the assumption is | database, and external tools can query the DB for metrics: the munin plugins | ||||||
| that it will be overwritten on a regular basis, and is aggregated anyways). The | in misc/ may be useful. Timestamps and sizes in this file will respect | ||||||
| keys are: | --blur-usage. The four tables are: | ||||||
| 
 | 
 | ||||||
| * active.connected: number of paired connections | "current" contains a single row, with these columns: | ||||||
| * active.waiting: number of not-yet-paired connections |  | ||||||
| * since_reboot.bytes: sum of 'total_bytes' |  | ||||||
| * since_reboot.total: number of completed connections |  | ||||||
| * since_reboot.moods: dict mapping mood string to number of connections |  | ||||||
| * all_time.bytes: same |  | ||||||
| * all_time.total |  | ||||||
| * all_time.moods |  | ||||||
| 
 | 
 | ||||||
| The server will write twistd.pid and twistd.log files as usual, if daemonized | * connected: number of paired connections | ||||||
| by twistd. twistd.log will only contain startup, shutdown, and exception | * waiting: number of not-yet-paired connections | ||||||
| messages. To record information about each connection, use --usage-logfile. | * partal_bytes: bytes transmitted over not-yet-complete connections | ||||||
|  | 
 | ||||||
|  | "since_reboot" contains a single row, with these columns: | ||||||
|  | 
 | ||||||
|  | * bytes: sum of 'total_bytes' | ||||||
|  | * connections: number of completed connections | ||||||
|  | * mood_happy: count of connections that finished "happy": both sides gave correct handshake | ||||||
|  | * mood_lonely: one side gave good handshake, other side never showed up | ||||||
|  | * mood_errory: one side gave a bad handshake | ||||||
|  | 
 | ||||||
|  | "all_time" contains a single row, with these columns: | ||||||
|  | 
 | ||||||
|  | * bytes: | ||||||
|  | * connections: | ||||||
|  | * mood_happy: | ||||||
|  | * mood_lonely: | ||||||
|  | * mood_errory: | ||||||
|  | 
 | ||||||
|  | "usage" contains one row per closed connection, with these columns: | ||||||
|  | 
 | ||||||
|  | * started: seconds since epoch, rounded to "blur time" | ||||||
|  | * total_time: seconds from first open to last close | ||||||
|  | * waiting_time: seconds from first open to second open, or None | ||||||
|  | * bytes: total bytes relayed (in both directions) | ||||||
|  | * result: (string) the mood: happy, lonely, errory | ||||||
|  | 
 | ||||||
|  | All tables will be updated after each connection is finished. In addition, | ||||||
|  | the "current" table will be updated at least once every 5 minutes. | ||||||
|  | 
 | ||||||
|  | If daemonized by twistd, the server will write twistd.pid and twistd.log | ||||||
|  | files as usual. By default twistd.log will only contain startup, shutdown, | ||||||
|  | and exception messages. Adding --log-stdout will add per-connection JSON | ||||||
|  | lines to twistd.log. | ||||||
| """ | """ | ||||||
| 
 | 
 | ||||||
| class Options(usage.Options): | class Options(usage.Options): | ||||||
|     #synopsis = "[--port=] [--usage-logfile=] [--blur-usage=] [--stats-json=]" |     #synopsis = "[--port=] [--log-stdout] [--blur-usage=] [--usage-db=]" | ||||||
|     longdesc = LONGDESC |     longdesc = LONGDESC | ||||||
| 
 | 
 | ||||||
|  |     optFlags = { | ||||||
|  |         ("log-stdout", None, "write JSON usage logs to stdout"), | ||||||
|  |         } | ||||||
|     optParameters = [ |     optParameters = [ | ||||||
|         ("port", "p", "tcp:4001", "endpoint to listen on"), |         ("port", "p", "tcp:4001", "endpoint to listen on"), | ||||||
|         ("blur-usage", None, None, "blur timestamps and data sizes in logs"), |         ("blur-usage", None, None, "blur timestamps and data sizes in logs"), | ||||||
|         ("usage-logfile", None, None, "record usage data (JSON lines)"), |         ("usage-db", None, None, "record usage data (SQLite)"), | ||||||
|         ("stats-file", None, None, "record usage in JSON format"), |  | ||||||
|         ] |         ] | ||||||
| 
 | 
 | ||||||
|     def opt_blur_usage(self, arg): |     def opt_blur_usage(self, arg): | ||||||
|  | @ -65,6 +92,6 @@ class Options(usage.Options): | ||||||
| def makeService(config, reactor=reactor): | def makeService(config, reactor=reactor): | ||||||
|     ep = endpoints.serverFromString(reactor, config["port"]) # to listen |     ep = endpoints.serverFromString(reactor, config["port"]) # to listen | ||||||
|     f = transit_server.Transit(blur_usage=config["blur-usage"], |     f = transit_server.Transit(blur_usage=config["blur-usage"], | ||||||
|                                usage_logfile=config["usage-logfile"], |                                log_stdout=config["log-stdout"], | ||||||
|                                stats_file=config["stats-file"]) |                                usage_db=config["usage-db"]) | ||||||
|     return StreamServerEndpointService(ep, f) |     return StreamServerEndpointService(ep, f) | ||||||
|  |  | ||||||
|  | @ -2,6 +2,7 @@ from __future__ import print_function, unicode_literals | ||||||
| import os, re, time, json | import os, re, time, json | ||||||
| from twisted.python import log | from twisted.python import log | ||||||
| from twisted.internet import protocol | from twisted.internet import protocol | ||||||
|  | from .database import get_db | ||||||
| 
 | 
 | ||||||
| SECONDS = 1.0 | SECONDS = 1.0 | ||||||
| MINUTE = 60*SECONDS | MINUTE = 60*SECONDS | ||||||
|  |  | ||||||
		Loading…
	
		Reference in New Issue
	
	Block a user